ImBuf: Performance IMB_transform.

This change uses generics to reduce code duplication an increases
flexibility and performance. Performance increase isn't measurable
for end users.
This commit is contained in:
Jeroen Bakker 2021-12-08 13:00:34 +01:00
parent 32b1a13fa1
commit 8f1997975d
1 changed files with 99 additions and 152 deletions

View File

@ -29,25 +29,6 @@
namespace blender::imbuf::transform {
/* -------------------------------------------------------------------- */
/** \name Image transform
* \{ */
static void pixel_from_buffer(
const struct ImBuf *ibuf, unsigned char **outI, float **outF, int x, int y)
{
size_t offset = ((size_t)ibuf->x) * y * 4 + 4 * x;
if (ibuf->rect) {
*outI = (unsigned char *)ibuf->rect + offset;
}
if (ibuf->rect_float) {
*outF = ibuf->rect_float + offset;
}
}
struct TransformUserData {
const ImBuf *src;
ImBuf *dst;
@ -56,6 +37,14 @@ struct TransformUserData {
float add_y[2];
rctf src_crop;
void init(const float transform_matrix[4][4])
{
init_start_uv(transform_matrix);
init_add_x(transform_matrix);
init_add_y(transform_matrix);
}
private:
void init_start_uv(const float transform_matrix[4][4])
{
float start_uv_v3[3];
@ -65,8 +54,9 @@ struct TransformUserData {
copy_v2_v2(start_uv, start_uv_v3);
}
void init_add_x(const float transform_matrix[4][4], const int width)
void init_add_x(const float transform_matrix[4][4])
{
const int width = src->x;
float add_x_v3[3];
float uv_max_x[3];
zero_v3(uv_max_x);
@ -78,8 +68,9 @@ struct TransformUserData {
copy_v2_v2(add_x, add_x_v3);
}
void init_add_y(const float transform_matrix[4][4], const int height)
void init_add_y(const float transform_matrix[4][4])
{
const int height = src->y;
float add_y_v3[3];
float uv_max_y[3];
zero_v3(uv_max_y);
@ -92,152 +83,106 @@ struct TransformUserData {
}
};
BLI_INLINE void imb_transform_scanlines(const TransformUserData *user_data,
int scanline,
InterpolationColorFunction interpolation)
{
const int width = user_data->dst->x;
template<eIMBTransformMode Mode, InterpolationColorFunction ColorInterpolation, int ChannelLen = 4>
class ScanlineProcessor {
private:
void pixel_from_buffer(const struct ImBuf *ibuf, unsigned char **outI, float **outF, int y) const
float uv[2];
madd_v2_v2v2fl(uv, user_data->start_uv, user_data->add_y, scanline);
{
const size_t offset = ((size_t)ibuf->x) * y * ChannelLen;
unsigned char *outI = nullptr;
float *outF = nullptr;
pixel_from_buffer(user_data->dst, &outI, &outF, 0, scanline);
for (int xi = 0; xi < width; xi++) {
interpolation(user_data->src, outI, outF, uv[0], uv[1]);
add_v2_v2(uv, user_data->add_x);
if (outI) {
outI += 4;
if (ibuf->rect) {
*outI = (unsigned char *)ibuf->rect + offset;
}
if (outF) {
outF += 4;
if (ibuf->rect_float) {
*outF = ibuf->rect_float + offset;
}
}
}
static void imb_transform_nearest_scanlines(void *custom_data, int scanline)
{
const TransformUserData *user_data = static_cast<const TransformUserData *>(custom_data);
InterpolationColorFunction interpolation = nullptr;
if (user_data->dst->rect_float) {
interpolation = nearest_interpolation_color_fl;
}
else {
interpolation = nearest_interpolation_color_char;
}
imb_transform_scanlines(user_data, scanline, interpolation);
}
public:
void process(const TransformUserData *user_data, int scanline)
{
const int width = user_data->dst->x;
static void imb_transform_bilinear_scanlines(void *custom_data, int scanline)
{
const TransformUserData *user_data = static_cast<const TransformUserData *>(custom_data);
InterpolationColorFunction interpolation = nullptr;
if (user_data->dst->rect_float) {
interpolation = bilinear_interpolation_color_fl;
}
else if (user_data->dst->rect) {
interpolation = bilinear_interpolation_color_char;
}
imb_transform_scanlines(user_data, scanline, interpolation);
}
float uv[2];
madd_v2_v2v2fl(uv, user_data->start_uv, user_data->add_y, scanline);
BLI_INLINE void imb_transform_scanlines_with_crop(const TransformUserData *user_data,
int scanline,
InterpolationColorFunction interpolation)
{
const int width = user_data->dst->x;
unsigned char *outI = nullptr;
float *outF = nullptr;
pixel_from_buffer(user_data->dst, &outI, &outF, scanline);
float uv[2];
madd_v2_v2v2fl(uv, user_data->start_uv, user_data->add_y, scanline);
unsigned char *outI = nullptr;
float *outF = nullptr;
pixel_from_buffer(user_data->dst, &outI, &outF, 0, scanline);
for (int xi = 0; xi < width; xi++) {
if (uv[0] >= user_data->src_crop.xmin && uv[0] < user_data->src_crop.xmax &&
uv[1] >= user_data->src_crop.ymin && uv[1] < user_data->src_crop.ymax) {
interpolation(user_data->src, outI, outF, uv[0], uv[1]);
}
add_v2_v2(uv, user_data->add_x);
if (outI) {
outI += 4;
}
if (outF) {
outF += 4;
for (int xi = 0; xi < width; xi++) {
if constexpr (Mode == IMB_TRANSFORM_MODE_CROP_SRC) {
if (uv[0] >= user_data->src_crop.xmin && uv[0] < user_data->src_crop.xmax &&
uv[1] >= user_data->src_crop.ymin && uv[1] < user_data->src_crop.ymax) {
ColorInterpolation(user_data->src, outI, outF, uv[0], uv[1]);
}
}
else {
ColorInterpolation(user_data->src, outI, outF, uv[0], uv[1]);
}
add_v2_v2(uv, user_data->add_x);
if (outI) {
outI += ChannelLen;
}
if (outF) {
outF += ChannelLen;
}
}
}
}
};
static void imb_transform_nearest_scanlines_with_crop(void *custom_data, int scanline)
template<typename Processor> void transform_scanline_function(void *custom_data, int scanline)
{
const TransformUserData *user_data = static_cast<const TransformUserData *>(custom_data);
InterpolationColorFunction interpolation = nullptr;
if (user_data->dst->rect_float) {
interpolation = nearest_interpolation_color_fl;
}
else {
interpolation = nearest_interpolation_color_char;
}
imb_transform_scanlines_with_crop(user_data, scanline, interpolation);
Processor processor;
processor.process(user_data, scanline);
}
static void imb_transform_bilinear_scanlines_with_crop(void *custom_data, int scanline)
{
const TransformUserData *user_data = static_cast<const TransformUserData *>(custom_data);
InterpolationColorFunction interpolation = nullptr;
if (user_data->dst->rect_float) {
interpolation = bilinear_interpolation_color_fl;
}
else if (user_data->dst->rect) {
interpolation = bilinear_interpolation_color_char;
}
imb_transform_scanlines_with_crop(user_data, scanline, interpolation);
}
template<InterpolationColorFunction DefaultFunction, InterpolationColorFunction WrapRepeatFunction>
ScanlineThreadFunc get_scanline_function(const eIMBTransformMode mode)
static void imb_transform_nearest_scanlines_with_repeat(void *custom_data, int scanline)
{
const TransformUserData *user_data = static_cast<const TransformUserData *>(custom_data);
InterpolationColorFunction interpolation = nearest_interpolation_color_wrap;
imb_transform_scanlines(user_data, scanline, interpolation);
}
static ScanlineThreadFunc imb_transform_scanline_func(const eIMBInterpolationFilterMode filter,
const eIMBTransformMode mode)
{
ScanlineThreadFunc scanline_func = nullptr;
switch (mode) {
case IMB_TRANSFORM_MODE_REGULAR:
switch (filter) {
case IMB_FILTER_NEAREST:
scanline_func = imb_transform_nearest_scanlines;
break;
case IMB_FILTER_BILINEAR:
scanline_func = imb_transform_bilinear_scanlines;
break;
}
break;
return transform_scanline_function<
ScanlineProcessor<IMB_TRANSFORM_MODE_REGULAR, DefaultFunction>>;
case IMB_TRANSFORM_MODE_CROP_SRC:
switch (filter) {
case IMB_FILTER_NEAREST:
scanline_func = imb_transform_nearest_scanlines_with_crop;
break;
case IMB_FILTER_BILINEAR:
scanline_func = imb_transform_bilinear_scanlines_with_crop;
break;
}
break;
return transform_scanline_function<
ScanlineProcessor<IMB_TRANSFORM_MODE_CROP_SRC, DefaultFunction>>;
case IMB_TRANSFORM_MODE_WRAP_REPEAT:
BLI_assert_msg(filter == IMB_FILTER_NEAREST,
"Repeat mode is only supported with nearest interpolation.");
scanline_func = imb_transform_nearest_scanlines_with_repeat;
break;
return transform_scanline_function<
ScanlineProcessor<IMB_TRANSFORM_MODE_WRAP_REPEAT, WrapRepeatFunction>>;
}
BLI_assert_unreachable();
return nullptr;
}
template<eIMBInterpolationFilterMode Filter>
static void transform(TransformUserData *user_data, const eIMBTransformMode mode)
{
ScanlineThreadFunc scanline_func = nullptr;
if (user_data->dst->rect_float) {
constexpr InterpolationColorFunction interpolation_function =
Filter == IMB_FILTER_NEAREST ? nearest_interpolation_color_fl :
bilinear_interpolation_color_fl;
scanline_func =
get_scanline_function<interpolation_function, nearest_interpolation_color_wrap>(mode);
}
else if (user_data->dst->rect) {
constexpr InterpolationColorFunction interpolation_function =
Filter == IMB_FILTER_NEAREST ? nearest_interpolation_color_char :
bilinear_interpolation_color_char;
scanline_func =
get_scanline_function<interpolation_function, nearest_interpolation_color_wrap>(mode);
}
if (scanline_func != nullptr) {
IMB_processor_apply_threaded_scanlines(user_data->dst->y, scanline_func, user_data);
}
return scanline_func;
}
} // namespace blender::imbuf::transform
@ -256,18 +201,20 @@ void IMB_transform(const struct ImBuf *src,
BLI_assert_msg(mode != IMB_TRANSFORM_MODE_CROP_SRC || src_crop != nullptr,
"No source crop rect given, but crop source is requested. Or source crop rect "
"was given, but crop source was not requested.");
TransformUserData user_data;
user_data.src = src;
user_data.dst = dst;
if (mode == IMB_TRANSFORM_MODE_CROP_SRC) {
user_data.src_crop = *src_crop;
}
user_data.init_start_uv(transform_matrix);
user_data.init_add_x(transform_matrix, src->x);
user_data.init_add_y(transform_matrix, src->y);
ScanlineThreadFunc scanline_func = imb_transform_scanline_func(filter, mode);
IMB_processor_apply_threaded_scanlines(dst->y, scanline_func, &user_data);
}
}
user_data.init(transform_matrix);
/** \} */
if (filter == IMB_FILTER_NEAREST) {
transform<IMB_FILTER_NEAREST>(&user_data, mode);
}
else {
transform<IMB_FILTER_BILINEAR>(&user_data, mode);
}
}
}