UltraGrid/test/ff_codec_conversions_test.cpp

#ifdef HAVE_CONFIG_H
#include "config.h"
#include "config_unix.h"
#include "config_win32.h"
#endif

#if defined HAVE_CPPUNIT && defined HAVE_LAVC

#include <algorithm>
#include <array>
#include <cppunit/config/SourcePrefix.h>
#include <iostream>
#include <random>
#include <string>
#include <vector>

#include "ff_codec_conversions_test.h"
#include "libavcodec_common.h"
#include "tv.h"
#include "video_capture/testcard_common.h"
#include "video_codec.h"

using namespace std::string_literals;

using std::array;
using std::copy;
using std::cout;
using std::default_random_engine;
using std::uniform_int_distribution;
using std::ifstream;
using std::min;
using std::max;
using std::to_string;
using std::vector;

constexpr int MIN_12B = 16;
constexpr int MAX_12B = 4079;


// Registers the fixture into the 'registry'
CPPUNIT_TEST_SUITE_REGISTRATION( ff_codec_conversions_test );

ff_codec_conversions_test::ff_codec_conversions_test()
{
}

ff_codec_conversions_test::~ff_codec_conversions_test()
{
}

void
ff_codec_conversions_test::setUp()
{
}

void
ff_codec_conversions_test::tearDown()
{
}

#define TIMER(t) struct timeval t{}; gettimeofday(&(t), nullptr)
void
ff_codec_conversions_test::test_yuv444pXXle_from_to_r10k()
{
        using namespace std::string_literals;

        constexpr int width = 320;
        constexpr int height = 240;
        vector <unsigned char> rgba_buf(width * height * 4);

        /// @todo Use 10-bit natively
        auto test_pattern = [&](AVPixelFormat avfmt) {
                vector <unsigned char> r10k_buf(width * height * 4);
                copy(rgba_buf.begin(), rgba_buf.end(), r10k_buf.begin());
                auto vc_copylineRGBAtoR10k = get_decoder_from_to(RGBA, R10k, true);
                assert(vc_copylineRGBAtoR10k != nullptr);
                vc_copylineRGBAtoR10k(r10k_buf.data(), r10k_buf.data(), 4L * width * height, 0, 8, 16);

                AVFrame frame;
                frame.format = avfmt;
                frame.width = width;
                frame.height = height;

                /* the image can be allocated by any means and av_image_alloc() is
                 * just the most convenient way if av_malloc() is to be used */
                assert(av_image_alloc(frame.data, frame.linesize,
                                        width, height, (AVPixelFormat) frame.format, 32) >= 0);

                auto from_conv = get_uv_to_av_conversion(R10k, frame.format);
                auto to_conv = get_av_to_uv_conversion(frame.format, R10k);
                assert(to_conv != nullptr && from_conv != nullptr);

                TIMER(t0);
                from_conv(&frame, r10k_buf.data(), width, height);
                TIMER(t1);
                to_conv(reinterpret_cast<char*>(r10k_buf.data()), &frame, width, height, vc_get_linesize(width, R10k), nullptr);
                TIMER(t2);

                if (getenv("PERF") != nullptr) {
                        cout << "test_yuv444p16le_from_to_r10k: duration - enc " << tv_diff(t1, t0) << ", dec " <<tv_diff(t2, t1) << "\n";
                }

                av_freep(frame.data);

                vector <unsigned char> rgba_buf_res(width * height * 4);
                vc_copyliner10k(rgba_buf_res.data(), r10k_buf.data(), height * vc_get_linesize(width, RGBA), 0, 8, 16);

                int max_diff = 0;
                for (size_t i = 0; i < width * height; ++i) {
                        for (int j = 0; j < 3; ++j) {
                                max_diff = max<int>(max_diff, abs(rgba_buf[4 * i + j] - rgba_buf_res[4 * i + j]));
                                //fprintf(stderr, "%d %d\n", (int) rgba_buf[4 * i + j], (int) rgba_buf_res[4 * i + j]);
                        }
                        //fprintf(stderr, "R in 10 bits = %d\n", (int) (r10k_buf[4 * i] << 2) + (r10k_buf[4 * i + 1] >> 6));
                }

                if (getenv("DEBUG_DUMP") != nullptr) {
                        FILE *out = fopen("out.rgba","w");
                        fwrite(rgba_buf_res.data(), width * height * 4, 1, out);
                        fclose(out);
                }

                CPPUNIT_ASSERT_MESSAGE("Maximal allowed difference 1, found "s + to_string(max_diff), max_diff <= 1);
        };

        for (auto f : { AV_PIX_FMT_YUV444P10LE, AV_PIX_FMT_YUV444P12LE, AV_PIX_FMT_YUV444P16LE }) {
                int i = 0;
                for_each(rgba_buf.begin(), rgba_buf.end(), [&](unsigned char & c) { c = (i++ / 4) % 0x100; });
                test_pattern(f);

                array<unsigned char, 4> pattern{ 0xFFU, 0, 0, 0xFFU };
                for_each(rgba_buf.begin(), rgba_buf.end(), [&](unsigned char & c) { c = pattern[i++ % 4]; });
                test_pattern(f);

                default_random_engine rand_gen;
                for_each(rgba_buf.begin(), rgba_buf.end(), [&](unsigned char & c) { c = rand_gen() % 0x100; });
                test_pattern(f);
        }
}

void
ff_codec_conversions_test::test_yuv444pXXle_from_to_r12l()
{
        using namespace std::string_literals;

        constexpr int width = 320;
        constexpr int height = 240;
        vector <unsigned char> rgb_buf(width * height * 3);

        /// @todo Use 12-bit natively
        auto test_pattern = [&](AVPixelFormat avfmt) {
                vector <unsigned char> r12l_buf(vc_get_datalen(width, height, R12L));
                decoder_t rgb_to_r12l = get_decoder_from_to(RGB, R12L, true);
                rgb_to_r12l(r12l_buf.data(), rgb_buf.data(), vc_get_datalen(width, height, R12L), 0, 8, 16);

                AVFrame frame;
                frame.format = avfmt;
                frame.width = width;
                frame.height = height;

                /* the image can be allocated by any means and av_image_alloc() is
                 * just the most convenient way if av_malloc() is to be used */
                assert(av_image_alloc(frame.data, frame.linesize,
                                        width, height, (AVPixelFormat) frame.format, 32) >= 0);

                auto from_conv = get_uv_to_av_conversion(R12L, frame.format);
                auto to_conv = get_av_to_uv_conversion(frame.format, R12L);
                assert(to_conv != nullptr && from_conv != nullptr);

                TIMER(t0);
                from_conv(&frame, r12l_buf.data(), width, height);
                TIMER(t1);
                to_conv(reinterpret_cast<char*>(r12l_buf.data()), &frame, width, height, vc_get_linesize(width, R12L), nullptr);
                TIMER(t2);

                if (getenv("PERF") != nullptr) {
                        cout << "test_yuv444p16le_from_to_r12l: duration - enc " << tv_diff(t1, t0) << ", dec " <<tv_diff(t2, t1) << "\n";
                }

                av_freep(frame.data);

                vector <unsigned char> rgb_buf_res(width * height * 3);
                decoder_t r12l_to_rgb = get_decoder_from_to(R12L, RGB, true);
                r12l_to_rgb(rgb_buf_res.data(), r12l_buf.data(), vc_get_datalen(width, height, RGB), 0, 8, 16);

                int max_diff = 0;
                for (size_t i = 0; i < width * height; ++i) {
                        for (int j = 0; j < 3; ++j) {
                                max_diff = max<int>(max_diff, abs(rgb_buf[3 * i + j] - rgb_buf_res[3 * i + j]));
                        }
                }

                if (getenv("DEBUG_DUMP") != nullptr) {
                        FILE *out = fopen("out.rgb","w");
                        fwrite(rgb_buf_res.data(), width * height * 3, 1, out);
                        fclose(out);
                }

                CPPUNIT_ASSERT_MESSAGE("Maximal allowed difference 1, found "s + to_string(max_diff), max_diff <= 1);
        };

        for (auto f : { AV_PIX_FMT_YUV444P10LE, AV_PIX_FMT_YUV444P12LE, AV_PIX_FMT_YUV444P16LE }) {
                int i = 0;
                array<unsigned char, 3> pattern{ 0xFFU, 0, 0 };
                for_each(rgb_buf.begin(), rgb_buf.end(), [&](unsigned char & c) { c = pattern[i++ % 3]; });
                test_pattern(f);

                for_each(rgb_buf.begin(), rgb_buf.end(), [&](unsigned char & c) { c = (i++ / 3) % 0x100; });
                test_pattern(f);

                default_random_engine rand_gen;
                for_each(rgb_buf.begin(), rgb_buf.end(), [&](unsigned char & c) { c = rand_gen() % 0x100; });
                test_pattern(f);
        }
}

static void yuv444p16le_rg48_encode_decode(int width, int height, char *in, char *out) {
        AVFrame frame{};
        frame.format = AV_PIX_FMT_YUV444P16LE;
        frame.width = width;
        frame.height = height;

        /* the image can be allocated by any means and av_image_alloc() is
         * just the most convenient way if av_malloc() is to be used */
        if (av_image_alloc(frame.data, frame.linesize,
                                width, height, (AVPixelFormat) frame.format, 32) < 0) {
                abort();
        }

        auto from_conv = get_uv_to_av_conversion(RG48, frame.format);
        auto to_conv = get_av_to_uv_conversion(frame.format, RG48);
        assert(to_conv != nullptr && from_conv != nullptr);

        TIMER(t0);
        from_conv(&frame, reinterpret_cast<unsigned char *>(in), width, height);
        TIMER(t1);
        to_conv(reinterpret_cast<char*>(out), &frame, width, height, vc_get_linesize(width, RG48), nullptr);
        TIMER(t2);

        if (getenv("PERF") != nullptr) {
                cout << "test_yuv444p16le_from_to_rg48: duration - enc " << tv_diff(t1, t0) << ", dec " <<tv_diff(t2, t1) << "\n";
        }

        av_freep(frame.data);
}

/**
 * Tests 12-bit values 0-4096 - max allowed range is MIN_12B-MAX_12B which should be
 * also the output - so comparing the output values against clamped input value. Also
 * using lower delta to accept because of the claming.
 */
void ff_codec_conversions_test::test_yuv444p16le_from_to_rg48_out_of_range()
{
        using namespace std::string_literals;

        constexpr int MAX_DIFF = 16;

        constexpr int width = 4096;
        constexpr int height = 5;
        vector <uint16_t> rg48_buf(width * height * 3);
        vector <uint16_t> rg48_buf_res(width * height * 3);

        for (int i = 0; i < 4096; i += 1) { // grayscale tones
                rg48_buf[3 * i] =
                        rg48_buf[3 * i + 1] =
                        rg48_buf[3 * i + 2] = 65535 * i / 4095;
        }
        for (int line = 0; line < 3; ++line) { // R, G, B scale
                for (int i = 0; i < 4096; i += 1) {
                        rg48_buf[(line + 1) * (width * 3) + 3 * i + line] = 65535 * i / 4095;
                }
        }
        for (int i = 0; i < 4096; i += 1) { // custom
                rg48_buf[4 * (width * 3) + 3 * i] = 65535;
                rg48_buf[4 * (width * 3) + 3 * i + 1] = 65535;
                rg48_buf[4 * (width * 3) + 3 * i + 2] = 0;
        }

        yuv444p16le_rg48_encode_decode(width, height, reinterpret_cast<char *>(rg48_buf.data()),
                        reinterpret_cast<char *>(rg48_buf_res.data()));

        int max_diff = 0;
        for (size_t i = 0; i < width * height; ++i) {
                for (int j = 0; j < 3; ++j) {
                        int in = rg48_buf[3 * i + j];
                        in = min(max(MIN_12B << 4U, in), MAX_12B << 4U);
                        int out = rg48_buf_res[3 * i + j];
                        int diff = in - out;
                        if (abs(diff) >= MAX_DIFF && getenv("DEBUG") != nullptr) {
                                cout << "different value at pos: " << i << "," << j << " diff: " << diff << "\n";
                        }
                        max_diff = max<int>(max_diff, abs(diff));
                        out >>= 4;
                        CPPUNIT_ASSERT_MESSAGE("Value "s + to_string(out) + " out of range "s + to_string(MIN_12B) + "-"s + to_string(MAX_12B), out >= MIN_12B && out <= MAX_12B);
                }
        }

        if (getenv("DEBUG_DUMP") != nullptr) {
                std::ofstream in("in.rg48", std::ifstream::out | std::ifstream::binary);
                in.write(reinterpret_cast<char *>(rg48_buf.data()), rg48_buf.size() * sizeof(decltype(rg48_buf)::value_type));
                std::ofstream out("out.rg48", std::ifstream::out | std::ifstream::binary);
                out.write(reinterpret_cast<char *>(rg48_buf_res.data()), rg48_buf_res.size() * sizeof(decltype(rg48_buf_res)::value_type));
        }

        CPPUNIT_ASSERT_MESSAGE("Maximal allowed difference "s + to_string (MAX_DIFF) + "/65535, found "s + to_string(max_diff), max_diff <= MAX_DIFF);
}

/**
 * Tests RG48<->YUV444P16LE conversions with 12-bit RGB input values
 * (full-range with the SDI small headroom)
 */
void ff_codec_conversions_test::test_yuv444p16le_from_to_rg48()
{
        constexpr int MAX_DIFF = 16; /// @todo look at the conversions to yield better precision

        int width = 2048;
        int height = 1;
        vector <uint16_t> rg48_buf(width * height * 3, MIN_12B << 4); // SDI minimal value
        vector <uint16_t> rg48_buf_res(width * height * 3);

        for (int i = 16; i < 2040; i += 1) {
                rg48_buf[3 * i] =
                        rg48_buf[3 * i + 1] =
                        rg48_buf[3 * i + 2] = (i * 2) << 4;
        }
        for (int i = 2040; i < 2048; i += 1) {
                rg48_buf[3 * i] =
                        rg48_buf[3 * i + 1] =
                        rg48_buf[3 * i + 2] = MAX_12B << 4;
        }

        if (getenv("UG_TEST_RG48_INPUT") != nullptr) {
                char *cpy = strdup(getenv("UG_TEST_RG48_INPUT"));
                char *filename = strtok(cpy, ":");
                width = atoi(strtok(nullptr, ":"));
                height = atoi(strtok(nullptr, ":"));
                rg48_buf.resize(width * height * 3);
                rg48_buf_res.resize(width * height * 3);
                ifstream in(filename, std::ifstream::in | std::ifstream::binary);
                in.read(reinterpret_cast<char *>(rg48_buf.data()), rg48_buf.size() * sizeof(decltype(rg48_buf)::value_type));
        }

        yuv444p16le_rg48_encode_decode(width, height, reinterpret_cast<char *>(rg48_buf.data()),
                        reinterpret_cast<char *>(rg48_buf_res.data()));

        int max_diff = 0;
        for (int i = 0; i < width * height; ++i) {
                for (int j = 0; j < 3; ++j) {
                        int in = rg48_buf[3 * i + j];
                        int out = rg48_buf_res[3 * i + j];
                        int diff = in - out;
                        if (abs(diff) >= MAX_DIFF && getenv("DEBUG") != nullptr) {
                                cout << "different value at pos: " << i << "," << j << " diff: " << diff << " in: " << in << " out: " << out << "\n";
                        }
                        max_diff = max<int>(max_diff, abs(diff));
                        out >>= 4;
                        CPPUNIT_ASSERT_MESSAGE("Value "s + to_string(out) + " out of range "s + to_string(MIN_12B) + "-"s + to_string(MAX_12B), out >= MIN_12B && out <= MAX_12B);
                }
        }

        if (getenv("DEBUG_DUMP") != nullptr) {
                std::ofstream in("in.rg48", std::ifstream::out | std::ifstream::binary);
                in.write(reinterpret_cast<char *>(rg48_buf.data()), rg48_buf.size() * sizeof(decltype(rg48_buf)::value_type));
                std::ofstream out("out.rg48", std::ifstream::out | std::ifstream::binary);
                out.write(reinterpret_cast<char *>(rg48_buf_res.data()), rg48_buf_res.size() * sizeof(decltype(rg48_buf_res)::value_type));
        }

        CPPUNIT_ASSERT_MESSAGE("Maximal allowed difference "s + to_string (MAX_DIFF) + "/65535, found "s + to_string(max_diff), max_diff <= MAX_DIFF);
}

/**
 * Just a simple test - use just dummy random data
 * @todo
 * Write more reasonable comparison to check P010LE with different neigboring lines.
 */
void ff_codec_conversions_test::test_pX10_from_to_v210()
{
        constexpr codec_t codec = v210;
        constexpr long width = 1920;
        constexpr long height = 4;
        const long linesize = vc_get_linesize(width, codec);
        vector <unsigned char> in(height * linesize);
        vector <unsigned char> out(height * linesize);
        default_random_engine rand_gen;
        uniform_int_distribution<uint32_t> dist(0, 0x3fffffffLU);

        for (auto &c : {AV_PIX_FMT_P010LE, AV_PIX_FMT_P210LE}) {
                AVFrame frame{};
                frame.format = c;
                frame.width = 1920;
                frame.height = 1080;
                if (av_image_alloc(frame.data, frame.linesize,
                                        width, height, (AVPixelFormat) frame.format, 32) < 0) {
                        abort();
                }

                if (c == AV_PIX_FMT_P210LE) {
                        std::for_each((uint32_t *) in.data(), (uint32_t *) (in.data() + height * linesize), [&](uint32_t & c) { c = dist(rand_gen); });
                } else { // later using dummy "==" compare, chroma in odd and even line must be same for P010 to avoid rounding errors
                        std::for_each((uint32_t *) in.data(), (uint32_t *) (in.data() + linesize), [&](uint32_t & c) { c =  dist(rand_gen); });
                        for (int i = 1; i < height; ++i) {
                                std::copy(in.data(), &in[linesize], &in[i * linesize]);
                        }
                }

                auto from_conv = get_uv_to_av_conversion(codec, frame.format);
                auto to_conv = get_av_to_uv_conversion(frame.format, codec);
                assert(from_conv != nullptr);
                assert(to_conv != nullptr);

                from_conv(&frame, in.data(), width, height);
                to_conv(reinterpret_cast<char *>(out.data()), &frame, width, height, vc_get_linesize(width, codec), nullptr);

                if (getenv("DEBUG_DUMP") != nullptr) {
                        for (int i = 0; i < 128; i += 1) {
                                auto *din = reinterpret_cast<uint32_t *>(in.data()) + i * 4;
                                auto *dout = reinterpret_cast<uint32_t *>(out.data()) + i * 4;
                                printf("0x%08x IN =%08x %08x %08x %08x\n", i * 16, din[0], din[1], din[2], din[3]);
                                printf("0x%08x OUT=%08x %08x %08x %08x\n", i * 16, dout[0], dout[1], dout[2], dout[3]);
                        }
                }

                CPPUNIT_ASSERT_MESSAGE("Error: output doesn't match input"s, in == out);
                out[(width / 2) * height] = 123;
                CPPUNIT_ASSERT_MESSAGE("Error: output matches input but it shouldn't"s, in != out);
                av_freep(frame.data);
        }
}

#endif // defined HAVE_CPPUNIT && HAVE_LAVC