main/cpp/RenderScriptToolkit.h

/*
 * Copyright (C) 2021 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
*32afb93cSXin Li
*32afb93cSXin Li#ifndef ANDROID_RENDERSCRIPT_TOOLKIT_TOOLKIT_H
*32afb93cSXin Li#define ANDROID_RENDERSCRIPT_TOOLKIT_TOOLKIT_H
*32afb93cSXin Li
#include <cstddef>
#include <cstdint>
#include <memory>
*32afb93cSXin Li
namespace renderscript {

class TaskProcessor;

/**
 * Define a range of data to process.
 *
 * This class is used to restrict a Toolkit operation to a rectangular subset of the input
 * tensor. Both axes are described as half-open intervals: the start index is included, the
 * end index is not.
 *
 * @property startX The index of the first value to be included on the X axis.
 * @property endX The index after the last value to be included on the X axis.
 * @property startY The index of the first value to be included on the Y axis.
 * @property endY The index after the last value to be included on the Y axis.
 */
struct Restriction {
    size_t startX;
    size_t endX;
    size_t startY;
    size_t endY;
};

/**
 * A collection of high-performance graphic utility functions like blur and blend.
 *
 * This toolkit provides ten image manipulation functions: blend, blur, color matrix, convolve,
 * histogram, histogramDot, lut, lut3d, resize, and YUV to RGB. These functions execute
 * multithreaded on the CPU.
 *
 * These functions work over raw byte arrays. You'll need to specify the width and height of
 * the data to be processed, as well as the number of bytes per pixel. For most use cases,
 * this will be 4.
 *
 * You should instantiate the Toolkit once and reuse it throughout your application.
 * On instantiation, the Toolkit creates a thread pool that's used for processing all the functions.
 * You can limit the number of pool threads used by the Toolkit via the constructor. The pool
 * threads are destroyed once the Toolkit is destroyed, after any pending work is done.
 *
 * This library is thread safe. You can call methods from different pool threads. The functions will
 * execute sequentially.
 *
 * A Java/Kotlin Toolkit is available. It calls this library through JNI.
 *
 * This toolkit can be used as a replacement for most RenderScript Intrinsic functions. Compared
 * to RenderScript, it's simpler to use and more than twice as fast on the CPU. However RenderScript
 * Intrinsics allow more flexibility for the type of allocation supported. In particular, this
 * toolkit does not support allocations of floats.
 */
class RenderScriptToolkit {
    /** Each Toolkit method call is converted to a Task. The processor owns the thread pool. It
     * tiles the tasks and schedules them over the pool threads.
     */
    std::unique_ptr<TaskProcessor> processor;

   public:
    /**
     * Creates the pool threads that are used for processing the method calls.
     *
     * @param numberOfThreads Limits the number of pool threads used by the Toolkit.
     */
    RenderScriptToolkit(int numberOfThreads = 0);
    /**
     * Destroys the thread pool. This stops any in-progress work; the Toolkit methods called from
     * other pool threads will return without having completed the work. Because of the undefined
     * state of the output buffers, an application should avoid destroying the Toolkit if other pool
     * threads are executing Toolkit methods.
     */
    ~RenderScriptToolkit();

    /**
     * Determines how a source buffer is blended into a destination buffer.
     *
     * See {@link RenderScriptToolkit::blend}.
     *
     * blend only works on 4 byte RGBA data. In the descriptions below, ".a" represents
     * the alpha channel.
     */
    enum class BlendingMode {
        /**
         * dest = 0
         *
         * The destination is cleared, i.e. each pixel is set to (0, 0, 0, 0)
         */
        CLEAR = 0,
        /**
         * dest = src
         *
         * Sets each pixel of the destination to the corresponding one in the source.
         */
        SRC = 1,
        /**
         * dest = dest
         *
         * Leaves the destination untouched. This is a no-op.
         */
        DST = 2,
        /**
         * dest = src + dest * (1.0 - src.a)
         */
        SRC_OVER = 3,
        /**
         * dest = dest + src * (1.0 - dest.a)
         */
        DST_OVER = 4,
        /**
         * dest = src * dest.a
         */
        SRC_IN = 5,
        /**
         * dest = dest * src.a
         */
        DST_IN = 6,
        /**
         * dest = src * (1.0 - dest.a)
         */
        SRC_OUT = 7,
        /**
         * dest = dest * (1.0 - src.a)
         */
        DST_OUT = 8,
        /**
         * dest.rgb = src.rgb * dest.a + (1.0 - src.a) * dest.rgb, dest.a = dest.a
         */
        SRC_ATOP = 9,
        /**
         * dest.rgb = dest.rgb * src.a + (1.0 - dest.a) * src.rgb, dest.a = src.a
         */
        DST_ATOP = 10,
        /**
         * dest = {src.r ^ dest.r, src.g ^ dest.g, src.b ^ dest.b, src.a ^ dest.a}
         *
         * Note: this is NOT the Porter/Duff XOR mode; this is a bitwise xor.
         */
        XOR = 11,
        /**
         * dest = src * dest
         */
        MULTIPLY = 12,
        /**
         * dest = min(src + dest, 1.0)
         */
        ADD = 13,
        /**
         * dest = max(dest - src, 0.0)
         */
        SUBTRACT = 14
    };

    /**
     * Blend a source buffer with the destination buffer.
     *
     * Blends a source buffer and a destination buffer, placing the result in the destination
     * buffer. The blending is done pairwise between two corresponding RGBA values found in
     * each buffer. The mode parameter specifies one of fifteen blending operations.
     * See {@link BlendingMode}.
     *
     * An optional range parameter can be set to restrict the operation to a rectangular subset
     * of each buffer. If provided, the range must be wholly contained within the dimensions
     * described by sizeX and sizeY.
     *
     * The source and destination buffers must have the same dimensions. Both buffers should be
     * large enough for sizeX * sizeY * 4 bytes. The buffers have a row-major layout.
     *
     * @param mode The specific blending operation to do.
     * @param source The RGBA input buffer.
     * @param dst The destination buffer. Used for input and output.
     * @param sizeX The width of both buffers, as a number of RGBA values.
     * @param sizeY The height of both buffers, as a number of RGBA values.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void blend(BlendingMode mode, const uint8_t* _Nonnull source, uint8_t* _Nonnull dst,
               size_t sizeX, size_t sizeY, const Restriction* _Nullable restriction = nullptr);

    /**
     * Blur an image.
     *
     * Performs a Gaussian blur of the input image and stores the result in the out buffer.
     *
     * The radius determines which pixels are used to compute each blurred pixel. This Toolkit
     * accepts values between 1 and 25. Larger values create a more blurred effect but also
     * take longer to compute. When the radius extends past the edge, the edge pixel will
     * be used as replacement for the pixel that's out of bounds.
     *
     * Each input pixel can either be represented by four bytes (RGBA format) or one byte
     * for the less common blurring of an alpha channel only image.
     *
     * An optional range parameter can be set to restrict the operation to a rectangular subset
     * of each buffer. If provided, the range must be wholly contained within the dimensions
     * described by sizeX and sizeY.
     *
     * The input and output buffers must have the same dimensions. Both buffers should be
     * large enough for sizeX * sizeY * vectorSize bytes. The buffers have a row-major layout.
     *
     * @param in The buffer of the image to be blurred.
     * @param out The buffer that receives the blurred image.
     * @param sizeX The width of both buffers, as a number of 1 or 4 byte cells.
     * @param sizeY The height of both buffers, as a number of 1 or 4 byte cells.
     * @param vectorSize Either 1 or 4, the number of bytes in each cell, i.e. A vs. RGBA.
     * @param radius The radius of the pixels used to blur.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void blur(const uint8_t* _Nonnull in, uint8_t* _Nonnull out, size_t sizeX, size_t sizeY,
              size_t vectorSize, int radius, const Restriction* _Nullable restriction = nullptr);

    /**
     * Identity matrix that can be passed to the {@link RenderScriptToolkit::colorMatrix} method.
     *
     * Using this matrix will result in no change to the pixel through multiplication although
     * the pixel value can still be modified by the add vector, or transformed to a different
     * format.
     */
    static constexpr float kIdentityMatrix[] =  {
            1.0f, 0.0f, 0.0f, 0.0f,
            0.0f, 1.0f, 0.0f, 0.0f,
            0.0f, 0.0f, 1.0f, 0.0f,
            0.0f, 0.0f, 0.0f, 1.0f
    };

    /**
     * Matrix to turn color pixels to a grey scale.
     *
     * Use this matrix with the {@link RenderScriptToolkit::colorMatrix} method to convert an
     * image from color to greyscale.
     */
    static constexpr float kGreyScaleColorMatrix[] = {
            0.299f, 0.299f, 0.299f, 0.0f,
            0.587f, 0.587f, 0.587f, 0.0f,
            0.114f, 0.114f, 0.114f, 0.0f,
            0.0f,   0.0f,   0.0f,   1.0f
    };

    /**
     * Matrix to convert RGB to YUV.
     *
     * Use this matrix with the {@link RenderScriptToolkit::colorMatrix} method to convert the
     * first three bytes of each pixel from RGB to YUV. This leaves the last byte (the alpha
     * channel) untouched.
     *
     * This is a simplistic conversion. Most YUV buffers have a more complicated format, not
     * supported by this method.
     */
    static constexpr float kRgbToYuvMatrix[] = {
            0.299f, -0.14713f,  0.615f,   0.0f,
            0.587f, -0.28886f, -0.51499f, 0.0f,
            0.114f,  0.436f,   -0.10001f, 0.0f,
            0.0f,    0.0f,      0.0f,     1.0f
    };

    /**
     * Matrix to convert YUV to RGB.
     *
     * Use this matrix with the {@link RenderScriptToolkit::colorMatrix} method to convert the
     * first three bytes of each pixel from YUV to RGB. This leaves the last byte (the alpha
     * channel) untouched.
     *
     * This is a simplistic conversion. Most YUV buffers have a more complicated format, not
     * supported by this method. Use {@link RenderScriptToolkit::yuvToRgb} to convert these
     * buffers.
     */
    static constexpr float kYuvToRgbMatrix[] = {
            1.0f,      1.0f,     1.0f,     0.0f,
            0.0f,     -0.39465f, 2.03211f, 0.0f,
            1.13983f, -0.5806f,  0.0f,     0.0f,
            0.0f,      0.0f,     0.0f,     1.0f
    };

    /**
     * Transform an image using a color matrix.
     *
     * Converts a 2D array of vectors of unsigned bytes, multiplying each vector by a 4x4 matrix
     * and adding an optional vector.
     *
     * Each input vector is composed of 1-4 unsigned bytes. If fewer than 4 bytes, it's extended
     * to 4, padding with zeroes. The unsigned bytes are converted from 0-255 to 0.0-1.0 floats
     * before the multiplication is done.
     *
     * The resulting value is normalized from 0.0-1.0 to a 0-255 value and stored in the output.
     * If the output vector size is less than four, the unused channels are discarded.
     *
     * If addVector is null, a vector of zeroes is added, i.e. a noop.
     *
     * Check kIdentityMatrix, kGreyScaleColorMatrix, kRgbToYuvMatrix, and kYuvToRgbMatrix for sample
     * matrices. The YUV conversion may not work for all color spaces.
     *
     * @param in The buffer of the image to be converted.
     * @param out The buffer that receives the converted image.
     * @param inputVectorSize The number of bytes in each input cell, a value from 1 to 4.
     * @param outputVectorSize The number of bytes in each output cell, a value from 1 to 4.
     * @param sizeX The width of both buffers, as a number of 1 to 4 byte cells.
     * @param sizeY The height of both buffers, as a number of 1 to 4 byte cells.
     * @param matrix The 4x4 matrix to multiply, in row major format.
     * @param addVector A vector of four floats that's added to the result of the multiplication.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void colorMatrix(const void* _Nonnull in, void* _Nonnull out, size_t inputVectorSize,
                     size_t outputVectorSize, size_t sizeX, size_t sizeY,
                     const float* _Nonnull matrix, const float* _Nullable addVector = nullptr,
                     const Restriction* _Nullable restriction = nullptr);

    /**
     * Convolve an image with a 3x3 kernel.
     *
     * convolve3x3 and convolve5x5 apply a 3x3 or 5x5 convolution to the input buffer using the
     * provided coefficients.
     *
     * For 3x3 convolutions, 9 coefficients must be provided. For 5x5, 25 coefficients are needed.
     * The coefficients should be provided in row-major format.
     *
     * When the square extends past the edge, the edge values will be used as replacement for the
     * values that are out of bounds.
     *
     * Each input cell can be represented by one to four bytes. Each byte is multiplied
     * and accumulated independently of the other bytes of the cell.
     *
     * An optional range parameter can be set to restrict the operation to a rectangular subset
     * of each buffer. If provided, the range must be wholly contained within the dimensions
     * described by sizeX and sizeY.
     *
     * The input and output buffers must have the same dimensions. Both buffers should be
     * large enough for sizeX * sizeY * vectorSize bytes. The buffers have a row-major layout.
     *
     * @param in The buffer of the image to be convolved.
     * @param out The buffer that receives the convolved image.
     * @param vectorSize The number of bytes in each cell, a value from 1 to 4.
     * @param sizeX The width of both buffers, as a number of 1 to 4 byte cells.
     * @param sizeY The height of both buffers, as a number of 1 to 4 byte cells.
     * @param coefficients The 9 multipliers of the 3x3 kernel, in row-major format.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void convolve3x3(const void* _Nonnull in, void* _Nonnull out, size_t vectorSize, size_t sizeX,
                     size_t sizeY, const float* _Nonnull coefficients,
                     const Restriction* _Nullable restriction = nullptr);

    /**
     * Convolve an image with a 5x5 kernel.
     *
     * Same contract as {@link RenderScriptToolkit::convolve3x3}, except that 25 coefficients
     * must be provided.
     *
     * @param in The buffer of the image to be convolved.
     * @param out The buffer that receives the convolved image.
     * @param vectorSize The number of bytes in each cell, a value from 1 to 4.
     * @param sizeX The width of both buffers, as a number of 1 to 4 byte cells.
     * @param sizeY The height of both buffers, as a number of 1 to 4 byte cells.
     * @param coefficients The 25 multipliers of the 5x5 kernel, in row-major format.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void convolve5x5(const void* _Nonnull in, void* _Nonnull out, size_t vectorSize, size_t sizeX,
                     size_t sizeY, const float* _Nonnull coefficients,
                     const Restriction* _Nullable restriction = nullptr);

    /**
     * Compute the histogram of an image.
     *
     * Tallies how many times each of the 256 possible values of a byte is found in the input.
     *
     * An input cell can be represented by one to four bytes. The tally is done independently
     * for each of the bytes of the cell. Correspondingly, the out array will have
     * 256 * vectorSize entries. The counts for value 0 are consecutive, followed by those for
     * value 1, etc.
     *
     * An optional range parameter can be set to restrict the operation to a rectangular subset
     * of the input buffer. If provided, the range must be wholly contained within the dimensions
     * described by sizeX and sizeY.
     *
     * The source buffer should be large enough for sizeX * sizeY * vectorSize bytes. It has a
     * row-major layout. The out buffer should be large enough for 256 * vectorSize ints.
     *
     * @param in The buffer of the image to be analyzed.
     * @param out The resulting vector of counts.
     * @param sizeX The width of the input buffer, as a number of 1 to 4 byte cells.
     * @param sizeY The height of the input buffer, as a number of 1 to 4 byte cells.
     * @param vectorSize The number of bytes in each cell, a value from 1 to 4.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void histogram(const uint8_t* _Nonnull in, int32_t* _Nonnull out, size_t sizeX, size_t sizeY,
                   size_t vectorSize, const Restriction* _Nullable restriction = nullptr);

    /**
     * Compute the histogram of the dot product of an image.
     *
     * This method supports cells of 1 to 4 bytes in length. For each cell of the array,
     * the dot product of its bytes with the provided coefficients is computed. The resulting
     * floating point value is converted to an unsigned byte and tallied in the histogram.
     *
     * If coefficients is null, the coefficients used for RGBA luminosity calculation will be used,
     * i.e. the values [0.299f, 0.587f, 0.114f, 0.f].
     *
     * Each coefficient must be >= 0 and their sum must be 1.0 or less. There must be the same
     * number of coefficients as vectorSize.
     *
     * An optional range parameter can be set to restrict the operation to a rectangular subset
     * of the input buffer. If provided, the range must be wholly contained within the dimensions
     * described by sizeX and sizeY.
     *
     * The source buffer should be large enough for sizeX * sizeY * vectorSize bytes. It has a
     * row-major layout. The out array should be large enough for 256 ints.
     *
     * @param in The buffer of the image to be analyzed.
     * @param out The resulting vector of counts.
     * @param sizeX The width of the input buffer, as a number of 1 to 4 byte cells.
     * @param sizeY The height of the input buffer, as a number of 1 to 4 byte cells.
     * @param vectorSize The number of bytes in each cell, a value from 1 to 4.
     * @param coefficients The values used for the dot product. Can be nullptr.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void histogramDot(const uint8_t* _Nonnull in, int32_t* _Nonnull out, size_t sizeX, size_t sizeY,
                      size_t vectorSize, const float* _Nullable coefficients,
                      const Restriction* _Nullable restriction = nullptr);

    /**
     * Transform an image using a look up table.
     *
     * Transforms an image by using a per-channel lookup table. Each channel of the input has an
     * independent lookup table. The tables are 256 entries in size and can cover the full value
     * range of a byte.
     *
     * The input array should be in RGBA format, where four consecutive bytes form a cell.
     *
     * An optional range parameter can be set to restrict the operation to a rectangular subset
     * of each buffer. If provided, the range must be wholly contained within the dimensions
     * described by sizeX and sizeY.
     *
     * The input and output buffers must have the same dimensions. Both buffers should be
     * large enough for sizeX * sizeY * 4 bytes. The buffers have a row-major layout.
     *
     * @param in The buffer of the image to be transformed.
     * @param out The buffer that receives the transformed image.
     * @param sizeX The width of both buffers, as a number of 4 byte cells.
     * @param sizeY The height of both buffers, as a number of 4 byte cells.
     * @param red An array of 256 values that's used to convert the R channel.
     * @param green An array of 256 values that's used to convert the G channel.
     * @param blue An array of 256 values that's used to convert the B channel.
     * @param alpha An array of 256 values that's used to convert the A channel.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void lut(const uint8_t* _Nonnull in, uint8_t* _Nonnull out, size_t sizeX, size_t sizeY,
             const uint8_t* _Nonnull red, const uint8_t* _Nonnull green,
             const uint8_t* _Nonnull blue, const uint8_t* _Nonnull alpha,
             const Restriction* _Nullable restriction = nullptr);

    /**
     * Transform an image using a 3D look up table.
     *
     * Transforms an image, converting RGB to RGBA by using a 3D lookup table. The incoming R, G,
     * and B values are normalized to the dimensions of the provided 3D buffer. The eight nearest
     * values in that 3D buffer are sampled and linearly interpolated. The resulting RGBA entry
     * is stored in the output.
     *
     * The input array should be in RGBA format, where four consecutive bytes form a cell.
     * The fourth byte of each input cell is ignored.
     *
     * An optional range parameter can be set to restrict the operation to a rectangular subset
     * of each buffer. If provided, the range must be wholly contained within the dimensions
     * described by sizeX and sizeY.
     *
     * The input and output buffers must have the same dimensions. Both buffers should be
     * large enough for sizeX * sizeY * 4 bytes. The buffers have a row-major layout.
     *
     * @param in The buffer of the image to be transformed.
     * @param out The buffer that receives the transformed image.
     * @param sizeX The width of both buffers, as a number of 4 byte cells.
     * @param sizeY The height of both buffers, as a number of 4 byte cells.
     * @param cube The translation cube, in row-major format.
     * @param cubeSizeX The number of RGBA entries in the cube in the X direction.
     * @param cubeSizeY The number of RGBA entries in the cube in the Y direction.
     * @param cubeSizeZ The number of RGBA entries in the cube in the Z direction.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void lut3d(const uint8_t* _Nonnull in, uint8_t* _Nonnull out, size_t sizeX, size_t sizeY,
               const uint8_t* _Nonnull cube, size_t cubeSizeX, size_t cubeSizeY, size_t cubeSizeZ,
               const Restriction* _Nullable restriction = nullptr);

    /**
     * Resize an image.
     *
     * Resizes an image using bicubic interpolation.
     *
     * This method supports cells of 1 to 4 bytes in length. Each byte of the cell is
     * interpolated independently from the others.
     *
     * An optional range parameter can be set to restrict the operation to a rectangular subset
     * of the output buffer. The corresponding scaled range of the input will be used. If provided,
     * the range must be wholly contained within the dimensions described by outputSizeX and
     * outputSizeY.
     *
     * The input and output buffers have a row-major layout. The input buffer should be large
     * enough for inputSizeX * inputSizeY * vectorSize bytes, and the output buffer for
     * outputSizeX * outputSizeY * vectorSize bytes.
     *
     * @param in The buffer of the image to be resized.
     * @param out The buffer that receives the resized image.
     * @param inputSizeX The width of the input buffer, as a number of 1-4 byte cells.
     * @param inputSizeY The height of the input buffer, as a number of 1-4 byte cells.
     * @param vectorSize The number of bytes in each cell of both buffers. A value from 1 to 4.
     * @param outputSizeX The width of the output buffer, as a number of 1-4 byte cells.
     * @param outputSizeY The height of the output buffer, as a number of 1-4 byte cells.
     * @param restriction When not null, restricts the operation to a 2D range of pixels.
     */
    void resize(const uint8_t* _Nonnull in, uint8_t* _Nonnull out, size_t inputSizeX,
                size_t inputSizeY, size_t vectorSize, size_t outputSizeX, size_t outputSizeY,
                const Restriction* _Nullable restriction = nullptr);

    /**
     * The YUV formats supported by yuvToRgb.
     */
    enum class YuvFormat {
        NV21 = 0x11,
        YV12 = 0x32315659,
    };

    /**
     * Convert an image from YUV to RGB.
     *
     * Converts an Android YUV buffer to RGB. The input buffer should be
     * supplied in one of the supported YUV formats, see {@link YuvFormat}.
     * The output is RGBA; the alpha channel will be set to 255.
     *
     * Note that for YV12 and a sizeX that's not a multiple of 32, the
     * RenderScript Intrinsic may not have converted the image correctly.
     * This Toolkit method should.
     *
     * @param in The buffer of the image to be converted.
     * @param out The buffer that receives the converted image.
     * @param sizeX The width in pixels of the image. Must be even.
     * @param sizeY The height in pixels of the image.
     * @param format Either YV12 or NV21.
     */
    void yuvToRgb(const uint8_t* _Nonnull in, uint8_t* _Nonnull out, size_t sizeX, size_t sizeY,
                  YuvFormat format);
};

}  // namespace renderscript
*32afb93cSXin Li
*32afb93cSXin Li#endif  // ANDROID_RENDERSCRIPT_TOOLKIT_TOOLKIT_H