// video2x/src/conversions.cpp

#include <cstddef>
#include <cstdint>
#include <cstdio>
#include <cstring>

// FFmpeg includes
extern "C" {
#include <libavutil/frame.h>
#include <libavutil/imgutils.h>
#include <libswscale/swscale.h>
}

// ncnn includes
#include <mat.h>

#include "conversions.h"

/**
 * Convert an AVFrame to another pixel format.
 *
 * A new frame is allocated with the same width and height as src_frame and
 * filled through libswscale. Only format, width and height are set on the new
 * frame; no other properties of src_frame are copied.
 *
 * @param src_frame Frame to convert. It is read but never modified or freed.
 * @param pix_fmt   Pixel format of the returned frame.
 * @return A newly allocated frame that the caller must release with
 *         av_frame_free(), or nullptr if src_frame is null, an allocation
 *         fails, or libswscale does not convert the whole frame.
 */
AVFrame *convert_avframe_pix_fmt(AVFrame *src_frame, AVPixelFormat pix_fmt) {
    if (src_frame == nullptr) {
        fprintf(stderr, "Source AVFrame is null.\n");
        return nullptr;
    }

    AVFrame *dst_frame = av_frame_alloc();
    if (dst_frame == nullptr) {
        fprintf(stderr, "Failed to allocate destination AVFrame.\n");
        return nullptr;
    }

    dst_frame->format = pix_fmt;
    dst_frame->width = src_frame->width;
    dst_frame->height = src_frame->height;

    // Allocate memory for the converted frame
    if (av_frame_get_buffer(dst_frame, 32) < 0) {
        fprintf(stderr, "Failed to allocate memory for AVFrame.\n");
        av_frame_free(&dst_frame);
        return nullptr;
    }

    // Create a SwsContext for pixel format conversion (same size in and out)
    SwsContext *sws_ctx = sws_getContext(
        src_frame->width,
        src_frame->height,
        static_cast<AVPixelFormat>(src_frame->format),
        dst_frame->width,
        dst_frame->height,
        pix_fmt,
        SWS_BILINEAR,
        nullptr,
        nullptr,
        nullptr
    );

    if (sws_ctx == nullptr) {
        fprintf(stderr, "Failed to initialize swscale context.\n");
        av_frame_free(&dst_frame);
        return nullptr;
    }

    // Perform the conversion; sws_scale reports the number of output rows written
    const int ret = sws_scale(
        sws_ctx,
        src_frame->data,
        src_frame->linesize,
        0,
        src_frame->height,
        dst_frame->data,
        dst_frame->linesize
    );

    // Clean up
    sws_freeContext(sws_ctx);

    // Anything other than a full frame of output rows means the destination
    // holds incomplete data, so do not hand it to the caller.
    if (ret != dst_frame->height) {
        fprintf(stderr, "Failed to convert AVFrame to destination pixel format.\n");
        av_frame_free(&dst_frame);
        return nullptr;
    }

    return dst_frame;
}

/**
 * Copy the pixels of an AVFrame into a newly allocated ncnn::Mat.
 *
 * The frame is first converted to BGR24 unless it already uses that format.
 * The resulting Mat is created as (width, height) with an element size of
 * 3 bytes and an element packing of 3, i.e. one packed BGR pixel per element.
 *
 * @param frame Source frame. It is read but never modified or freed.
 * @return A Mat owning a copy of the pixel data, or an empty Mat if frame is
 *         null, the BGR24 conversion fails, or the Mat cannot be allocated.
 */
ncnn::Mat avframe_to_ncnn_mat(AVFrame *frame) {
    if (frame == nullptr) {
        fprintf(stderr, "Input AVFrame is null.\n");
        return ncnn::Mat();
    }

    // Use the frame directly when it is already BGR24; otherwise convert it
    AVFrame *converted_frame = frame;
    if (frame->format != AV_PIX_FMT_BGR24) {
        converted_frame = convert_avframe_pix_fmt(frame, AV_PIX_FMT_BGR24);
        if (!converted_frame) {
            fprintf(stderr, "Failed to convert AVFrame to BGR24.\n");
            return ncnn::Mat();  // Return an empty ncnn::Mat on failure
        }
    }

    // Allocate a new ncnn::Mat and copy the data
    const int width = converted_frame->width;
    const int height = converted_frame->height;
    ncnn::Mat ncnn_image = ncnn::Mat(width, height, static_cast<size_t>(3), 3);  // BGR has 3 channels

    // A failed allocation leaves the Mat without data; copying into it would
    // write through a null pointer.
    if (ncnn_image.empty()) {
        fprintf(stderr, "Failed to allocate ncnn::Mat for the frame.\n");
        if (converted_frame != frame) {
            av_frame_free(&converted_frame);
        }
        return ncnn::Mat();
    }

    // Copy row by row: the AVFrame stride (linesize) may differ from width * 3,
    // while the Mat rows are addressed through row().
    const uint8_t *src_data = converted_frame->data[0];
    const std::ptrdiff_t src_stride = converted_frame->linesize[0];
    for (int y = 0; y < height; y++) {
        uint8_t *dst_row = ncnn_image.row<uint8_t>(y);
        // Widen before multiplying so the byte offset cannot overflow int
        const uint8_t *src_row = src_data + static_cast<std::ptrdiff_t>(y) * src_stride;
        memcpy(dst_row, src_row, static_cast<size_t>(width) * 3);  // 3 bytes (BGR) per pixel
    }

    // If we allocated a converted frame, free it
    if (converted_frame != frame) {
        av_frame_free(&converted_frame);
    }

    return ncnn_image;
}

/**
 * Convert an ncnn::Mat holding packed BGR pixels into an AVFrame of the
 * requested pixel format.
 *
 * The Mat rows are copied into an intermediate BGR24 frame, which libswscale
 * then converts into the destination frame. The intermediate frame is always
 * released before returning.
 *
 * NOTE(review): each Mat row is assumed to hold mat.w packed 3-byte BGR pixels,
 * as produced by avframe_to_ncnn_mat(); this is not verified here.
 *
 * @param mat     Source image; mat.w and mat.h give the output dimensions.
 * @param pix_fmt Pixel format of the returned frame.
 * @return A newly allocated frame that the caller must release with
 *         av_frame_free(), or nullptr if mat is empty, an allocation fails,
 *         or the pixel format conversion fails.
 */
AVFrame *ncnn_mat_to_avframe(const ncnn::Mat &mat, AVPixelFormat pix_fmt) {
    // An empty Mat has no pixel data to read rows from
    if (mat.empty()) {
        fprintf(stderr, "Input ncnn::Mat is empty.\n");
        return nullptr;
    }

    // Step 1: Allocate a destination AVFrame for the specified pixel format
    AVFrame *dst_frame = av_frame_alloc();
    if (!dst_frame) {
        fprintf(stderr, "Failed to allocate destination AVFrame.\n");
        return nullptr;
    }

    dst_frame->format = pix_fmt;
    dst_frame->width = mat.w;
    dst_frame->height = mat.h;

    // Allocate memory for the frame buffer
    if (av_frame_get_buffer(dst_frame, 32) < 0) {
        fprintf(stderr, "Failed to allocate memory for destination AVFrame.\n");
        av_frame_free(&dst_frame);
        return nullptr;
    }

    // Step 2: Convert ncnn::Mat to BGR AVFrame
    AVFrame *bgr_frame = av_frame_alloc();
    if (!bgr_frame) {
        fprintf(stderr, "Failed to allocate intermediate BGR AVFrame.\n");
        av_frame_free(&dst_frame);
        return nullptr;
    }

    bgr_frame->format = AV_PIX_FMT_BGR24;
    bgr_frame->width = mat.w;
    bgr_frame->height = mat.h;

    // Allocate memory for the intermediate BGR frame
    if (av_frame_get_buffer(bgr_frame, 32) < 0) {
        fprintf(stderr, "Failed to allocate memory for BGR AVFrame.\n");
        av_frame_free(&dst_frame);
        av_frame_free(&bgr_frame);
        return nullptr;
    }

    // Copy row by row: the AVFrame stride (linesize) may differ from mat.w * 3,
    // so a single bulk copy could misplace rows.
    const std::ptrdiff_t bgr_stride = bgr_frame->linesize[0];
    for (int y = 0; y < mat.h; y++) {
        // Widen before multiplying so the byte offset cannot overflow int
        uint8_t *dst_row = bgr_frame->data[0] + static_cast<std::ptrdiff_t>(y) * bgr_stride;
        const uint8_t *src_row = mat.row<const uint8_t>(y);
        memcpy(dst_row, src_row, static_cast<size_t>(mat.w) * 3);  // 3 bytes (BGR) per pixel
    }

    // Step 3: Convert the BGR frame to the desired pixel format
    SwsContext *sws_ctx = sws_getContext(
        bgr_frame->width,
        bgr_frame->height,
        AV_PIX_FMT_BGR24,
        dst_frame->width,
        dst_frame->height,
        pix_fmt,
        SWS_BILINEAR,
        nullptr,
        nullptr,
        nullptr
    );

    if (sws_ctx == nullptr) {
        fprintf(stderr, "Failed to initialize swscale context.\n");
        av_frame_free(&bgr_frame);
        av_frame_free(&dst_frame);
        return nullptr;
    }

    // Perform the conversion; sws_scale reports the number of output rows written
    const int ret = sws_scale(
        sws_ctx,
        bgr_frame->data,
        bgr_frame->linesize,
        0,
        bgr_frame->height,
        dst_frame->data,
        dst_frame->linesize
    );

    // Clean up the temporaries regardless of the outcome
    sws_freeContext(sws_ctx);
    av_frame_free(&bgr_frame);

    // Anything other than a full frame of output rows is treated as a failure
    if (ret != dst_frame->height) {
        fprintf(stderr, "Failed to convert BGR AVFrame to destination pixel format.\n");
        av_frame_free(&dst_frame);
        return nullptr;
    }

    return dst_frame;
}
feat(*): rewritten the project with C/C++ (#1172) 2024-10-08 02:29:00 +00:00			`#include <cstdio>`

			`// FFmpeg includes`
			`extern "C" {`
			`#include <libavutil/frame.h>`
			`#include <libavutil/imgutils.h>`
			`#include <libswscale/swscale.h>`
			`}`

			`// ncnn includes`
			`#include <mat.h>`

			`#include "conversions.h"`

			`// Convert AVFrame format`
			`AVFrame *convert_avframe_pix_fmt(AVFrame *src_frame, AVPixelFormat pix_fmt) {`
			`AVFrame *dst_frame = av_frame_alloc();`
			`if (dst_frame == nullptr) {`
			`fprintf(stderr, "Failed to allocate destination AVFrame.\n");`
			`return nullptr;`
			`}`

			`dst_frame->format = pix_fmt;`
			`dst_frame->width = src_frame->width;`
			`dst_frame->height = src_frame->height;`

			`// Allocate memory for the converted frame`
			`if (av_frame_get_buffer(dst_frame, 32) < 0) {`
			`fprintf(stderr, "Failed to allocate memory for AVFrame.\n");`
			`av_frame_free(&dst_frame);`
			`return nullptr;`
			`}`

			`// Create a SwsContext for pixel format conversion`
			`SwsContext *sws_ctx = sws_getContext(`
			`src_frame->width,`
			`src_frame->height,`
			`static_cast<AVPixelFormat>(src_frame->format),`
			`dst_frame->width,`
			`dst_frame->height,`
			`pix_fmt,`
			`SWS_BILINEAR,`
			`nullptr,`
			`nullptr,`
			`nullptr`
			`);`

			`if (sws_ctx == nullptr) {`
			`fprintf(stderr, "Failed to initialize swscale context.\n");`
			`av_frame_free(&dst_frame);`
			`return nullptr;`
			`}`

			`// Perform the conversion`
			`sws_scale(`
			`sws_ctx,`
			`src_frame->data,`
			`src_frame->linesize,`
			`0,`
			`src_frame->height,`
			`dst_frame->data,`
			`dst_frame->linesize`
			`);`

			`// Clean up`
			`sws_freeContext(sws_ctx);`

			`return dst_frame;`
			`}`

			`// Convert AVFrame to ncnn::Mat by copying the data`
			`ncnn::Mat avframe_to_ncnn_mat(AVFrame *frame) {`
			`AVFrame *converted_frame = nullptr;`

			`// Convert to BGR24 format if necessary`
			`if (frame->format != AV_PIX_FMT_BGR24) {`
			`converted_frame = convert_avframe_pix_fmt(frame, AV_PIX_FMT_BGR24);`
			`if (!converted_frame) {`
			`fprintf(stderr, "Failed to convert AVFrame to BGR24.\n");`
			`return ncnn::Mat(); // Return an empty ncnn::Mat on failure`
			`}`
			`} else {`
			`converted_frame = frame; // If the frame is already in BGR24, use it directly`
			`}`

			`// Allocate a new ncnn::Mat and copy the data`
			`int width = converted_frame->width;`
			`int height = converted_frame->height;`
			`ncnn::Mat ncnn_image = ncnn::Mat(width, height, (size_t)3, 3); // BGR has 3 channels`

			`// Manually copy the pixel data from AVFrame to the new ncnn::Mat`
			`const uint8_t *src_data = converted_frame->data[0];`
			`for (int y = 0; y < height; y++) {`
			`uint8_t *dst_row = ncnn_image.row<uint8_t>(y);`
			`const uint8_t *src_row = src_data + y * converted_frame->linesize[0];`
			`memcpy(dst_row, src_row, width * 3); // Copy 3 channels (BGR) per pixel`
			`}`

			`// If we allocated a converted frame, free it`
			`if (converted_frame != frame) {`
			`av_frame_free(&converted_frame);`
			`}`

			`return ncnn_image;`
			`}`

			`// Convert ncnn::Mat to AVFrame with a specified pixel format (this part is unchanged)`
			`AVFrame *ncnn_mat_to_avframe(const ncnn::Mat &mat, AVPixelFormat pix_fmt) {`
			`int ret;`

			`// Step 1: Allocate a destination AVFrame for the specified pixel format`
			`AVFrame *dst_frame = av_frame_alloc();`
			`if (!dst_frame) {`
			`fprintf(stderr, "Failed to allocate destination AVFrame.\n");`
			`return nullptr;`
			`}`

			`dst_frame->format = pix_fmt;`
			`dst_frame->width = mat.w;`
			`dst_frame->height = mat.h;`

			`// Allocate memory for the frame buffer`
			`if (av_frame_get_buffer(dst_frame, 32) < 0) {`
			`fprintf(stderr, "Failed to allocate memory for destination AVFrame.\n");`
			`av_frame_free(&dst_frame);`
			`return nullptr;`
			`}`

			`// Step 2: Convert ncnn::Mat to BGR AVFrame`
			`AVFrame *bgr_frame = av_frame_alloc();`
			`if (!bgr_frame) {`
			`fprintf(stderr, "Failed to allocate intermediate BGR AVFrame.\n");`
			`av_frame_free(&dst_frame);`
			`return nullptr;`
			`}`

			`bgr_frame->format = AV_PIX_FMT_BGR24;`
			`bgr_frame->width = mat.w;`
			`bgr_frame->height = mat.h;`

			`// Allocate memory for the intermediate BGR frame`
			`if (av_frame_get_buffer(bgr_frame, 32) < 0) {`
			`fprintf(stderr, "Failed to allocate memory for BGR AVFrame.\n");`
			`av_frame_free(&dst_frame);`
			`av_frame_free(&bgr_frame);`
			`return nullptr;`
			`}`

			`// Copy data from ncnn::Mat to the BGR AVFrame`
			`// mat.to_pixels(bgr_frame->data[0], ncnn::Mat::PIXEL_BGR);`

			`// Manually copy the pixel data from ncnn::Mat to the BGR AVFrame`
			`for (int y = 0; y < mat.h; y++) {`
			`uint8_t *dst_row = bgr_frame->data[0] + y * bgr_frame->linesize[0];`
			`const uint8_t *src_row = mat.row<const uint8_t>(y);`
			`memcpy(dst_row, src_row, mat.w * 3); // Copy 3 channels (BGR) per pixel`
			`}`

			`// Step 3: Convert the BGR frame to the desired pixel format`
			`SwsContext *sws_ctx = sws_getContext(`
			`bgr_frame->width,`
			`bgr_frame->height,`
			`AV_PIX_FMT_BGR24,`
			`dst_frame->width,`
			`dst_frame->height,`
			`pix_fmt,`
			`SWS_BILINEAR,`
			`nullptr,`
			`nullptr,`
			`nullptr`
			`);`

			`if (sws_ctx == nullptr) {`
			`fprintf(stderr, "Failed to initialize swscale context.\n");`
			`av_frame_free(&bgr_frame);`
			`av_frame_free(&dst_frame);`
			`return nullptr;`
			`}`

			`// Perform the conversion`
			`ret = sws_scale(`
			`sws_ctx,`
			`bgr_frame->data,`
			`bgr_frame->linesize,`
			`0,`
			`bgr_frame->height,`
			`dst_frame->data,`
			`dst_frame->linesize`
			`);`

			`// Clean up`
			`sws_freeContext(sws_ctx);`
			`av_frame_free(&bgr_frame);`

			`if (ret != dst_frame->height) {`
			`fprintf(stderr, "Failed to convert BGR AVFrame to destination pixel format.\n");`
			`av_frame_free(&dst_frame);`
			`return nullptr;`
			`}`

			`return dst_frame;`
			`}`