media_capture: honour the render texture format in MediaCaptureMF::ConvertVideoFrame

ConvertVideoFrame() changes from a static helper into a const member function
so that it can read m_video_render_texture_format:

  * GPUTexture::Format::RGBA8: same conversion as before. Bytes 0 and 2 of
    every 4-byte pixel are swapped (rgba -> bgra), vector_width (4) pixels at
    a time through a GSVector4i byte shuffle, followed by a scalar loop for
    the pixels past aligned_width.
  * any other format: each row is copied unmodified with std::memcpy,
    sizeof(u32) * width bytes per row.

In both branches, when g_gpu_device->UsesLowerLeftOrigin() returns false the
source pointer is moved to the last row and the source stride is negated, so
rows are written to dst in reverse order (vertical flip).

Review notes:

  * NOTE(review): this patch was recovered from a copy in which line breaks,
    indentation and angle-bracketed template arguments had been lost. The
    arguments in "ComPtr<IMFMediaType>*", "static_cast<size_t>" and
    "std::make_signed_t<size_t>" were restored by inference. GSVector4i::load
    and GSVector4i::store may also have carried explicit template arguments.
    Verify all of them against the tree before applying.
  * NOTE(review): leading whitespace and the position of blank context lines
    are reconstructed. The line counts agree with both hunk headers, but
    applying may need whitespace tolerance (e.g. git apply --ignore-whitespace).
  * NOTE(review): both row loops run their body before testing remaining_rows,
    and the flip computes (height - 1). A height of 0 would therefore wrap
    around. The removed code behaved the same way; presumably callers never
    pass an empty frame. TODO confirm.
  * NOTE(review): the memcpy branch assumes 4 bytes per pixel for every format
    other than RGBA8 (presumably BGRA8). TODO confirm where
    m_video_render_texture_format is assigned.

diff --git a/src/util/media_capture.cpp b/src/util/media_capture.cpp
index fa16795d32..8c29abdfb4 100644
--- a/src/util/media_capture.cpp
+++ b/src/util/media_capture.cpp
@@ -585,7 +585,7 @@ class MediaCaptureMF final : public MediaCaptureBase
                                                   Error* error);
   bool GetAudioTypes(std::string_view codec, ComPtr<IMFMediaType>* input_type, ComPtr<IMFMediaType>* output_type,
                      u32 sample_rate, u32 bitrate, Error* error);
-  static void ConvertVideoFrame(u8* dst, size_t dst_stride, const u8* src, size_t src_stride, u32 width, u32 height);
+  void ConvertVideoFrame(u8* dst, size_t dst_stride, const u8* src, size_t src_stride, u32 width, u32 height) const;
   bool ProcessVideoOutputSamples(Error* error); // synchronous
   bool ProcessVideoEvents(Error* error);        // asynchronous
 
@@ -1041,48 +1041,67 @@ MediaCaptureMF::ComPtr MediaCaptureMF::CreateVideoEncodeTransform(
 }
 
 ALWAYS_INLINE_RELEASE void MediaCaptureMF::ConvertVideoFrame(u8* dst, size_t dst_stride, const u8* src,
-                                                             size_t src_stride, u32 width, u32 height)
+                                                             size_t src_stride, u32 width, u32 height) const
 {
-  // need to convert rgba -> bgra, as well as flipping vertically
-  const u32 vector_width = 4;
-  const u32 aligned_width = Common::AlignDownPow2(width, vector_width);
-
   if (!g_gpu_device->UsesLowerLeftOrigin())
   {
     src += src_stride * (height - 1);
     src_stride = static_cast<size_t>(-static_cast<std::make_signed_t<size_t>>(src_stride));
   }
 
-  for (u32 remaining_rows = height;;)
+  if (m_video_render_texture_format == GPUTexture::Format::RGBA8)
   {
-    const u8* row_src = src;
-    u8* row_dst = dst;
-
-    u32 x = 0;
-    for (; x < aligned_width; x += vector_width)
+    // need to convert rgba -> bgra, as well as flipping vertically
+    const u32 vector_width = 4;
+    const u32 aligned_width = Common::AlignDownPow2(width, vector_width);
+    for (u32 remaining_rows = height;;)
     {
-      static constexpr GSVector4i mask = GSVector4i::cxpr8(2, 1, 0, 3, 6, 5, 4, 7, 10, 9, 8, 11, 14, 13, 12, 15);
-      GSVector4i::store(row_dst, GSVector4i::load(row_src).shuffle8(mask));
-      row_src += vector_width * sizeof(u32);
-      row_dst += vector_width * sizeof(u32);
-    }
+      const u8* row_src = src;
+      u8* row_dst = dst;
 
-    for (; x < width; x++)
-    {
-      row_dst[0] = row_src[2];
-      row_dst[1] = row_src[1];
-      row_dst[2] = row_src[0];
-      row_dst[3] = row_src[3];
-      row_src += sizeof(u32);
-      row_dst += sizeof(u32);
-    }
+      u32 x = 0;
+      for (; x < aligned_width; x += vector_width)
+      {
+        static constexpr GSVector4i mask = GSVector4i::cxpr8(2, 1, 0, 3, 6, 5, 4, 7, 10, 9, 8, 11, 14, 13, 12, 15);
+        GSVector4i::store(row_dst, GSVector4i::load(row_src).shuffle8(mask));
+        row_src += vector_width * sizeof(u32);
+        row_dst += vector_width * sizeof(u32);
+      }
 
-    src += src_stride;
-    dst += dst_stride;
+      for (; x < width; x++)
+      {
+        row_dst[0] = row_src[2];
+        row_dst[1] = row_src[1];
+        row_dst[2] = row_src[0];
+        row_dst[3] = row_src[3];
+        row_src += sizeof(u32);
+        row_dst += sizeof(u32);
+      }
 
-    remaining_rows--;
-    if (remaining_rows == 0)
-      break;
+      src += src_stride;
+      dst += dst_stride;
+
+      remaining_rows--;
+      if (remaining_rows == 0)
+        break;
+    }
+  }
+  else
+  {
+    // only flip
+    const u32 copy_width = sizeof(u32) * width;
+    for (u32 remaining_rows = height;;)
+    {
+      const u8* row_src = src;
+      u8* row_dst = dst;
+      std::memcpy(row_dst, row_src, copy_width);
+      src += src_stride;
+      dst += dst_stride;
+
+      remaining_rows--;
+      if (remaining_rows == 0)
+        break;
+    }
   }
 }
 