#include // FFmpeg includes extern "C" { #include #include #include } // ncnn includes #include #include "conversions.h" // Convert AVFrame format AVFrame *convert_avframe_pix_fmt(AVFrame *src_frame, AVPixelFormat pix_fmt) { AVFrame *dst_frame = av_frame_alloc(); if (dst_frame == nullptr) { fprintf(stderr, "Failed to allocate destination AVFrame.\n"); return nullptr; } dst_frame->format = pix_fmt; dst_frame->width = src_frame->width; dst_frame->height = src_frame->height; // Allocate memory for the converted frame if (av_frame_get_buffer(dst_frame, 32) < 0) { fprintf(stderr, "Failed to allocate memory for AVFrame.\n"); av_frame_free(&dst_frame); return nullptr; } // Create a SwsContext for pixel format conversion SwsContext *sws_ctx = sws_getContext( src_frame->width, src_frame->height, static_cast(src_frame->format), dst_frame->width, dst_frame->height, pix_fmt, SWS_BILINEAR, nullptr, nullptr, nullptr ); if (sws_ctx == nullptr) { fprintf(stderr, "Failed to initialize swscale context.\n"); av_frame_free(&dst_frame); return nullptr; } // Perform the conversion sws_scale( sws_ctx, src_frame->data, src_frame->linesize, 0, src_frame->height, dst_frame->data, dst_frame->linesize ); // Clean up sws_freeContext(sws_ctx); return dst_frame; } // Convert AVFrame to ncnn::Mat by copying the data ncnn::Mat avframe_to_ncnn_mat(AVFrame *frame) { AVFrame *converted_frame = nullptr; // Convert to BGR24 format if necessary if (frame->format != AV_PIX_FMT_BGR24) { converted_frame = convert_avframe_pix_fmt(frame, AV_PIX_FMT_BGR24); if (!converted_frame) { fprintf(stderr, "Failed to convert AVFrame to BGR24.\n"); return ncnn::Mat(); // Return an empty ncnn::Mat on failure } } else { converted_frame = frame; // If the frame is already in BGR24, use it directly } // Allocate a new ncnn::Mat and copy the data int width = converted_frame->width; int height = converted_frame->height; ncnn::Mat ncnn_image = ncnn::Mat(width, height, (size_t)3, 3); // BGR has 3 channels // Manually copy the pixel data from AVFrame to the new ncnn::Mat const uint8_t *src_data = converted_frame->data[0]; for (int y = 0; y < height; y++) { uint8_t *dst_row = ncnn_image.row(y); const uint8_t *src_row = src_data + y * converted_frame->linesize[0]; memcpy(dst_row, src_row, width * 3); // Copy 3 channels (BGR) per pixel } // If we allocated a converted frame, free it if (converted_frame != frame) { av_frame_free(&converted_frame); } return ncnn_image; } // Convert ncnn::Mat to AVFrame with a specified pixel format (this part is unchanged) AVFrame *ncnn_mat_to_avframe(const ncnn::Mat &mat, AVPixelFormat pix_fmt) { int ret; // Step 1: Allocate a destination AVFrame for the specified pixel format AVFrame *dst_frame = av_frame_alloc(); if (!dst_frame) { fprintf(stderr, "Failed to allocate destination AVFrame.\n"); return nullptr; } dst_frame->format = pix_fmt; dst_frame->width = mat.w; dst_frame->height = mat.h; // Allocate memory for the frame buffer if (av_frame_get_buffer(dst_frame, 32) < 0) { fprintf(stderr, "Failed to allocate memory for destination AVFrame.\n"); av_frame_free(&dst_frame); return nullptr; } // Step 2: Convert ncnn::Mat to BGR AVFrame AVFrame *bgr_frame = av_frame_alloc(); if (!bgr_frame) { fprintf(stderr, "Failed to allocate intermediate BGR AVFrame.\n"); av_frame_free(&dst_frame); return nullptr; } bgr_frame->format = AV_PIX_FMT_BGR24; bgr_frame->width = mat.w; bgr_frame->height = mat.h; // Allocate memory for the intermediate BGR frame if (av_frame_get_buffer(bgr_frame, 32) < 0) { fprintf(stderr, "Failed to allocate memory for BGR AVFrame.\n"); av_frame_free(&dst_frame); av_frame_free(&bgr_frame); return nullptr; } // Copy data from ncnn::Mat to the BGR AVFrame // mat.to_pixels(bgr_frame->data[0], ncnn::Mat::PIXEL_BGR); // Manually copy the pixel data from ncnn::Mat to the BGR AVFrame for (int y = 0; y < mat.h; y++) { uint8_t *dst_row = bgr_frame->data[0] + y * bgr_frame->linesize[0]; const uint8_t *src_row = mat.row(y); memcpy(dst_row, src_row, mat.w * 3); // Copy 3 channels (BGR) per pixel } // Step 3: Convert the BGR frame to the desired pixel format SwsContext *sws_ctx = sws_getContext( bgr_frame->width, bgr_frame->height, AV_PIX_FMT_BGR24, dst_frame->width, dst_frame->height, pix_fmt, SWS_BILINEAR, nullptr, nullptr, nullptr ); if (sws_ctx == nullptr) { fprintf(stderr, "Failed to initialize swscale context.\n"); av_frame_free(&bgr_frame); av_frame_free(&dst_frame); return nullptr; } // Perform the conversion ret = sws_scale( sws_ctx, bgr_frame->data, bgr_frame->linesize, 0, bgr_frame->height, dst_frame->data, dst_frame->linesize ); // Clean up sws_freeContext(sws_ctx); av_frame_free(&bgr_frame); if (ret != dst_frame->height) { fprintf(stderr, "Failed to convert BGR AVFrame to destination pixel format.\n"); av_frame_free(&dst_frame); return nullptr; } return dst_frame; }