chromium/third_party/mediapipe/src/mediapipe/util/frame_buffer/halide/rgb_yuv_generator.cc

// Copyright 2023 The MediaPipe Authors.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//      http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "Halide.h"

namespace {

class RgbYuv : public Halide::Generator<RgbYuv> {
 public:
  Var x{"x"}, y{"y"}, c{"c"};

  // Input<Buffer> because that allows us to apply constraints on stride, etc.
  Input<Buffer<uint8_t, 3>> src_rgb{"rgb"};

  Output<Func> dst_y{"dst_y", UInt(8), 2};
  Output<Func> dst_uv{"dst_uv", UInt(8), 3};

  void generate();
  void schedule();
};

// Integer math versions of the full-range JFIF RGB-YUV coefficients.
//   Y =  0.2990*R + 0.5870*G + 0.1140*B
//   U = -0.1687*R - 0.3313*G + 0.5000*B + 128
//   V =  0.5000*R - 0.4187*G - 0.0813*B + 128
// See https://www.w3.org/Graphics/JPEG/jfif3.pdf. These coefficients are
// similar to, but not identical, to those used in Android.
Halide::Tuple rgbyuv(Halide::Expr r, Halide::Expr g, Halide::Expr b) {
  r = Halide::cast<int32_t>(r);
  g = Halide::cast<int32_t>(g);
  b = Halide::cast<int32_t>(b);
  return {
      (19595 * r + 38470 * g + 7474 * b + 32768) >> 16,
      ((-11056 * r - 21712 * g + 32768 * b + 32768) >> 16) + 128,
      ((32768 * r - 27440 * g - 5328 * b + 32768) >> 16) + 128,
  };
}

void RgbYuv::generate() {
  Halide::Func yuv_tuple("yuv_tuple");
  yuv_tuple(x, y) =
      rgbyuv(src_rgb(x, y, 0), src_rgb(x, y, 1), src_rgb(x, y, 2));

  // Y values are copied one-for-one; UV values are sampled 1/4.
  // TODO: Take the average UV values across the 2x2 block.
  dst_y(x, y) = Halide::saturating_cast<uint8_t>(yuv_tuple(x, y)[0]);
  dst_uv(x, y, c) = Halide::saturating_cast<uint8_t>(Halide::select(
      c == 0, yuv_tuple(x * 2, y * 2)[2], yuv_tuple(x * 2, y * 2)[1]));
  // NOTE: uv channel indices above assume NV21; this can be abstracted out
  // by twiddling strides in calling code.
}

void RgbYuv::schedule() {
  // RGB images starts at index zero in every dimension.
  src_rgb.dim(0).set_min(0);
  src_rgb.dim(1).set_min(0);
  src_rgb.dim(2).set_min(0);

  // Require that the input buffer be interleaved and tightly-packed;
  // that is, either RGBRGBRGB[...] or RGBARGBARGBA[...], without gaps
  // between pixels.
  src_rgb.dim(0).set_stride(src_rgb.dim(2).extent());
  src_rgb.dim(2).set_stride(1);

  // Y plane dimensions start at zero. We could additionally constrain the
  // extent to be even, but that doesn't seem to have any benefit.
  Halide::Func dst_y_func = dst_y;
  Halide::OutputImageParam dst_y_output = dst_y_func.output_buffer();
  dst_y_output.dim(0).set_min(0);
  dst_y_output.dim(1).set_min(0);

  // UV plane has two channels and is half the size of the Y plane in X/Y.
  Halide::Func dst_uv_func = dst_uv;
  Halide::OutputImageParam dst_uv_output = dst_uv_func.output_buffer();
  dst_uv_output.dim(0).set_bounds(0, (dst_y_output.dim(0).extent() + 1) / 2);
  dst_uv_output.dim(1).set_bounds(0, (dst_y_output.dim(1).extent() + 1) / 2);
  dst_uv_output.dim(2).set_bounds(0, 2);

  // UV channel processing should be loop unrolled.
  dst_uv_func.reorder(c, x, y);
  dst_uv_func.unroll(c);

  // Remove default memory layout constraints and accept/produce generic UV
  // (including semi-planar and planar).
  dst_uv_output.dim(0).set_stride(Expr());
}

}  // namespace

HALIDE_REGISTER_GENERATOR(RgbYuv, rgb_yuv_generator)