mirror of
https://gitlab.freedesktop.org/mesa/mesa.git
synced 2026-02-18 12:40:31 +01:00
radeon: add software untiling functions
This commit is contained in:
parent
65faa27aa6
commit
5fefca5dba
2 changed files with 225 additions and 0 deletions
|
|
@ -245,6 +245,227 @@ void tile_image(const void * src, unsigned src_pitch,
|
|||
}
|
||||
}
|
||||
|
||||
static void micro_untile_8_x_4_8bit(const void * const src, unsigned src_pitch,
|
||||
void * const dst, unsigned dst_pitch,
|
||||
unsigned width, unsigned height)
|
||||
{
|
||||
unsigned row; /* current destination row */
|
||||
unsigned col; /* current destination column */
|
||||
unsigned k; /* current tile number */
|
||||
const unsigned tile_width = 8, tile_height = 4;
|
||||
const unsigned tiles_in_row = (width + (tile_width - 1)) / tile_width;
|
||||
|
||||
assert(src_pitch % tile_width == 0);
|
||||
|
||||
k = 0;
|
||||
for (row = 0; row < height; row += tile_height)
|
||||
{
|
||||
for (col = 0; col < width; col += tile_width, ++k)
|
||||
{
|
||||
uint8_t *src2 = (uint8_t *)src + row * src_pitch +
|
||||
(k % tiles_in_row) * MICRO_TILE_SIZE / sizeof(uint8_t);
|
||||
uint8_t *dst2 = (uint8_t *)dst + dst_pitch * row + col;
|
||||
unsigned j;
|
||||
|
||||
for (j = 0; j < MIN2(tile_height, height - row); ++j)
|
||||
{
|
||||
unsigned columns = MIN2(tile_width, width - col);
|
||||
memcpy(dst2, src2, columns * sizeof(uint8_t));
|
||||
dst2 += dst_pitch;
|
||||
src2 += tile_width;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static void micro_untile_8_x_2_16bit(const void * const src, unsigned src_pitch,
|
||||
void * const dst, unsigned dst_pitch,
|
||||
unsigned width, unsigned height)
|
||||
{
|
||||
unsigned row; /* current destination row */
|
||||
unsigned col; /* current destination column */
|
||||
unsigned k; /* current tile number */
|
||||
const unsigned tile_width = 8, tile_height = 2;
|
||||
const unsigned tiles_in_row = (width + (tile_width - 1)) / tile_width;
|
||||
|
||||
assert(src_pitch % tile_width == 0);
|
||||
|
||||
k = 0;
|
||||
for (row = 0; row < height; row += tile_height)
|
||||
{
|
||||
for (col = 0; col < width; col += tile_width, ++k)
|
||||
{
|
||||
uint16_t *src2 = (uint16_t *)src + row * src_pitch +
|
||||
(k % tiles_in_row) * MICRO_TILE_SIZE / sizeof(uint16_t);
|
||||
uint16_t *dst2 = (uint16_t *)dst + dst_pitch * row + col;
|
||||
unsigned j;
|
||||
|
||||
for (j = 0; j < MIN2(tile_height, height - row); ++j)
|
||||
{
|
||||
unsigned columns = MIN2(tile_width, width - col);
|
||||
memcpy(dst2, src2, columns * sizeof(uint16_t));
|
||||
dst2 += dst_pitch;
|
||||
src2 += tile_width;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static void micro_untile_4_x_4_16bit(const void * const src, unsigned src_pitch,
|
||||
void * const dst, unsigned dst_pitch,
|
||||
unsigned width, unsigned height)
|
||||
{
|
||||
unsigned row; /* current destination row */
|
||||
unsigned col; /* current destination column */
|
||||
unsigned k; /* current tile number */
|
||||
const unsigned tile_width = 4, tile_height = 4;
|
||||
const unsigned tiles_in_row = (width + (tile_width - 1)) / tile_width;
|
||||
|
||||
assert(src_pitch % tile_width == 0);
|
||||
|
||||
k = 0;
|
||||
for (row = 0; row < height; row += tile_height)
|
||||
{
|
||||
for (col = 0; col < width; col += tile_width, ++k)
|
||||
{
|
||||
uint16_t *src2 = (uint16_t *)src + row * src_pitch +
|
||||
(k % tiles_in_row) * MICRO_TILE_SIZE / sizeof(uint16_t);
|
||||
uint16_t *dst2 = (uint16_t *)dst + dst_pitch * row + col;
|
||||
unsigned j;
|
||||
|
||||
for (j = 0; j < MIN2(tile_height, height - row); ++j)
|
||||
{
|
||||
unsigned columns = MIN2(tile_width, width - col);
|
||||
memcpy(dst2, src2, columns * sizeof(uint16_t));
|
||||
dst2 += dst_pitch;
|
||||
src2 += tile_width;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static void micro_untile_4_x_2_32bit(const void * const src, unsigned src_pitch,
|
||||
void * const dst, unsigned dst_pitch,
|
||||
unsigned width, unsigned height)
|
||||
{
|
||||
unsigned row; /* current destination row */
|
||||
unsigned col; /* current destination column */
|
||||
unsigned k; /* current tile number */
|
||||
const unsigned tile_width = 4, tile_height = 2;
|
||||
const unsigned tiles_in_row = (width + (tile_width - 1)) / tile_width;
|
||||
|
||||
assert(src_pitch % tile_width == 0);
|
||||
|
||||
k = 0;
|
||||
for (row = 0; row < height; row += tile_height)
|
||||
{
|
||||
for (col = 0; col < width; col += tile_width, ++k)
|
||||
{
|
||||
uint32_t *src2 = (uint32_t *)src + row * src_pitch +
|
||||
(k % tiles_in_row) * MICRO_TILE_SIZE / sizeof(uint32_t);
|
||||
uint32_t *dst2 = (uint32_t *)dst + dst_pitch * row + col;
|
||||
unsigned j;
|
||||
|
||||
for (j = 0; j < MIN2(tile_height, height - row); ++j)
|
||||
{
|
||||
unsigned columns = MIN2(tile_width, width - col);
|
||||
memcpy(dst2, src2, columns * sizeof(uint32_t));
|
||||
dst2 += dst_pitch;
|
||||
src2 += tile_width;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static void micro_untile_2_x_2_64bit(const void * const src, unsigned src_pitch,
|
||||
void * const dst, unsigned dst_pitch,
|
||||
unsigned width, unsigned height)
|
||||
{
|
||||
unsigned row; /* current destination row */
|
||||
unsigned col; /* current destination column */
|
||||
unsigned k; /* current tile number */
|
||||
const unsigned tile_width = 2, tile_height = 2;
|
||||
const unsigned tiles_in_row = (width + (tile_width - 1)) / tile_width;
|
||||
|
||||
assert(src_pitch % tile_width == 0);
|
||||
|
||||
k = 0;
|
||||
for (row = 0; row < height; row += tile_height)
|
||||
{
|
||||
for (col = 0; col < width; col += tile_width, ++k)
|
||||
{
|
||||
uint64_t *src2 = (uint64_t *)src + row * src_pitch +
|
||||
(k % tiles_in_row) * MICRO_TILE_SIZE / sizeof(uint64_t);
|
||||
uint64_t *dst2 = (uint64_t *)dst + dst_pitch * row + col;
|
||||
unsigned j;
|
||||
|
||||
for (j = 0; j < MIN2(tile_height, height - row); ++j)
|
||||
{
|
||||
unsigned columns = MIN2(tile_width, width - col);
|
||||
memcpy(dst2, src2, columns * sizeof(uint64_t));
|
||||
dst2 += dst_pitch;
|
||||
src2 += tile_width;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static void micro_untile_1_x_1_128bit(const void * src, unsigned src_pitch,
|
||||
void * dst, unsigned dst_pitch,
|
||||
unsigned width, unsigned height)
|
||||
{
|
||||
unsigned i, j;
|
||||
const unsigned elem_size = 16; /* sizeof(uint128_t) */
|
||||
|
||||
for (j = 0; j < height; ++j)
|
||||
{
|
||||
for (i = 0; i < width; ++i)
|
||||
{
|
||||
memcpy(dst, src, width * elem_size);
|
||||
dst += dst_pitch * elem_size;
|
||||
src += src_pitch * elem_size;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
void untile_image(const void * src, unsigned src_pitch,
|
||||
void *dst, unsigned dst_pitch,
|
||||
gl_format format, unsigned width, unsigned height)
|
||||
{
|
||||
assert(src_pitch >= width);
|
||||
assert(dst_pitch >= width);
|
||||
assert(src_pitch * _mesa_get_format_bytes(format) % MICRO_TILE_SIZE == 0);
|
||||
|
||||
switch (_mesa_get_format_bytes(format))
|
||||
{
|
||||
case 16:
|
||||
micro_untile_1_x_1_128bit(src, src_pitch, dst, dst_pitch, width, height);
|
||||
break;
|
||||
case 8:
|
||||
micro_untile_2_x_2_64bit(src, src_pitch, dst, dst_pitch, width, height);
|
||||
break;
|
||||
case 4:
|
||||
micro_untile_4_x_2_32bit(src, src_pitch, dst, dst_pitch, width, height);
|
||||
break;
|
||||
case 2:
|
||||
if (_mesa_get_format_bits(format, GL_DEPTH_BITS))
|
||||
{
|
||||
micro_untile_4_x_4_16bit(src, src_pitch, dst, dst_pitch, width, height);
|
||||
}
|
||||
else
|
||||
{
|
||||
micro_untile_8_x_2_16bit(src, src_pitch, dst, dst_pitch, width, height);
|
||||
}
|
||||
break;
|
||||
case 1:
|
||||
micro_untile_8_x_4_8bit(src, src_pitch, dst, dst_pitch, width, height);
|
||||
break;
|
||||
default:
|
||||
assert(0);
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
void get_tile_size(gl_format format, unsigned *block_width, unsigned *block_height)
|
||||
{
|
||||
switch (_mesa_get_format_bytes(format))
|
||||
|
|
|
|||
|
|
@ -31,4 +31,8 @@ void tile_image(const void * src, unsigned src_pitch,
|
|||
void *dst, unsigned dst_pitch,
|
||||
gl_format format, unsigned width, unsigned height);
|
||||
|
||||
void untile_image(const void * src, unsigned src_pitch,
|
||||
void *dst, unsigned dst_pitch,
|
||||
gl_format format, unsigned width, unsigned height);
|
||||
|
||||
void get_tile_size(gl_format format, unsigned *block_width, unsigned *block_height);
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue