Merge pull request #2073 from lioncash/opus
hwopus: Implement DecodeInterleaved (the newest variant)
This commit is contained in:
		@@ -5,7 +5,6 @@
 | 
			
		||||
#include <chrono>
 | 
			
		||||
#include <cstring>
 | 
			
		||||
#include <memory>
 | 
			
		||||
#include <optional>
 | 
			
		||||
#include <vector>
 | 
			
		||||
 | 
			
		||||
#include <opus.h>
 | 
			
		||||
@@ -30,48 +29,66 @@ public:
 | 
			
		||||
                                u32 channel_count)
 | 
			
		||||
        : ServiceFramework("IHardwareOpusDecoderManager"), decoder(std::move(decoder)),
 | 
			
		||||
          sample_rate(sample_rate), channel_count(channel_count) {
 | 
			
		||||
        // clang-format off
 | 
			
		||||
        static const FunctionInfo functions[] = {
 | 
			
		||||
            {0, &IHardwareOpusDecoderManager::DecodeInterleaved, "DecodeInterleaved"},
 | 
			
		||||
            {0, &IHardwareOpusDecoderManager::DecodeInterleavedOld, "DecodeInterleavedOld"},
 | 
			
		||||
            {1, nullptr, "SetContext"},
 | 
			
		||||
            {2, nullptr, "DecodeInterleavedForMultiStream"},
 | 
			
		||||
            {2, nullptr, "DecodeInterleavedForMultiStreamOld"},
 | 
			
		||||
            {3, nullptr, "SetContextForMultiStream"},
 | 
			
		||||
            {4, &IHardwareOpusDecoderManager::DecodeInterleavedWithPerformance,
 | 
			
		||||
             "DecodeInterleavedWithPerformance"},
 | 
			
		||||
            {5, nullptr, "Unknown5"},
 | 
			
		||||
            {6, nullptr, "Unknown6"},
 | 
			
		||||
            {7, nullptr, "Unknown7"},
 | 
			
		||||
            {4, &IHardwareOpusDecoderManager::DecodeInterleavedWithPerfOld, "DecodeInterleavedWithPerfOld"},
 | 
			
		||||
            {5, nullptr, "DecodeInterleavedForMultiStreamWithPerfOld"},
 | 
			
		||||
            {6, &IHardwareOpusDecoderManager::DecodeInterleaved, "DecodeInterleaved"},
 | 
			
		||||
            {7, nullptr, "DecodeInterleavedForMultiStream"},
 | 
			
		||||
        };
 | 
			
		||||
        // clang-format on
 | 
			
		||||
 | 
			
		||||
        RegisterHandlers(functions);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
private:
 | 
			
		||||
    /// Describes extra behavior that may be asked of the decoding context.
 | 
			
		||||
    enum class ExtraBehavior {
 | 
			
		||||
        /// No extra behavior.
 | 
			
		||||
        None,
 | 
			
		||||
 | 
			
		||||
        /// Resets the decoder context back to a freshly initialized state.
 | 
			
		||||
        ResetContext,
 | 
			
		||||
    };
 | 
			
		||||
 | 
			
		||||
    void DecodeInterleavedOld(Kernel::HLERequestContext& ctx) {
 | 
			
		||||
        LOG_DEBUG(Audio, "called");
 | 
			
		||||
 | 
			
		||||
        DecodeInterleavedHelper(ctx, nullptr, ExtraBehavior::None);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    void DecodeInterleavedWithPerfOld(Kernel::HLERequestContext& ctx) {
 | 
			
		||||
        LOG_DEBUG(Audio, "called");
 | 
			
		||||
 | 
			
		||||
        u64 performance = 0;
 | 
			
		||||
        DecodeInterleavedHelper(ctx, &performance, ExtraBehavior::None);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    void DecodeInterleaved(Kernel::HLERequestContext& ctx) {
 | 
			
		||||
        LOG_DEBUG(Audio, "called");
 | 
			
		||||
 | 
			
		||||
        u32 consumed = 0;
 | 
			
		||||
        u32 sample_count = 0;
 | 
			
		||||
        std::vector<opus_int16> samples(ctx.GetWriteBufferSize() / sizeof(opus_int16));
 | 
			
		||||
        if (!Decoder_DecodeInterleaved(consumed, sample_count, ctx.ReadBuffer(), samples)) {
 | 
			
		||||
            LOG_ERROR(Audio, "Failed to decode opus data");
 | 
			
		||||
            IPC::ResponseBuilder rb{ctx, 2};
 | 
			
		||||
            // TODO(ogniK): Use correct error code
 | 
			
		||||
            rb.Push(ResultCode(-1));
 | 
			
		||||
            return;
 | 
			
		||||
        }
 | 
			
		||||
        IPC::ResponseBuilder rb{ctx, 4};
 | 
			
		||||
        rb.Push(RESULT_SUCCESS);
 | 
			
		||||
        rb.Push<u32>(consumed);
 | 
			
		||||
        rb.Push<u32>(sample_count);
 | 
			
		||||
        ctx.WriteBuffer(samples.data(), samples.size() * sizeof(s16));
 | 
			
		||||
        IPC::RequestParser rp{ctx};
 | 
			
		||||
        const auto extra_behavior =
 | 
			
		||||
            rp.Pop<bool>() ? ExtraBehavior::ResetContext : ExtraBehavior::None;
 | 
			
		||||
 | 
			
		||||
        u64 performance = 0;
 | 
			
		||||
        DecodeInterleavedHelper(ctx, &performance, extra_behavior);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    void DecodeInterleavedWithPerformance(Kernel::HLERequestContext& ctx) {
 | 
			
		||||
        LOG_DEBUG(Audio, "called");
 | 
			
		||||
 | 
			
		||||
    void DecodeInterleavedHelper(Kernel::HLERequestContext& ctx, u64* performance,
 | 
			
		||||
                                 ExtraBehavior extra_behavior) {
 | 
			
		||||
        u32 consumed = 0;
 | 
			
		||||
        u32 sample_count = 0;
 | 
			
		||||
        u64 performance = 0;
 | 
			
		||||
        std::vector<opus_int16> samples(ctx.GetWriteBufferSize() / sizeof(opus_int16));
 | 
			
		||||
 | 
			
		||||
        if (extra_behavior == ExtraBehavior::ResetContext) {
 | 
			
		||||
            ResetDecoderContext();
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        if (!Decoder_DecodeInterleaved(consumed, sample_count, ctx.ReadBuffer(), samples,
 | 
			
		||||
                                       performance)) {
 | 
			
		||||
            LOG_ERROR(Audio, "Failed to decode opus data");
 | 
			
		||||
@@ -80,25 +97,28 @@ private:
 | 
			
		||||
            rb.Push(ResultCode(-1));
 | 
			
		||||
            return;
 | 
			
		||||
        }
 | 
			
		||||
        IPC::ResponseBuilder rb{ctx, 6};
 | 
			
		||||
 | 
			
		||||
        const u32 param_size = performance != nullptr ? 6 : 4;
 | 
			
		||||
        IPC::ResponseBuilder rb{ctx, param_size};
 | 
			
		||||
        rb.Push(RESULT_SUCCESS);
 | 
			
		||||
        rb.Push<u32>(consumed);
 | 
			
		||||
        rb.Push<u32>(sample_count);
 | 
			
		||||
        rb.Push<u64>(performance);
 | 
			
		||||
        if (performance) {
 | 
			
		||||
            rb.Push<u64>(*performance);
 | 
			
		||||
        }
 | 
			
		||||
        ctx.WriteBuffer(samples.data(), samples.size() * sizeof(s16));
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    bool Decoder_DecodeInterleaved(
 | 
			
		||||
        u32& consumed, u32& sample_count, const std::vector<u8>& input,
 | 
			
		||||
        std::vector<opus_int16>& output,
 | 
			
		||||
        std::optional<std::reference_wrapper<u64>> performance_time = std::nullopt) {
 | 
			
		||||
    bool Decoder_DecodeInterleaved(u32& consumed, u32& sample_count, const std::vector<u8>& input,
 | 
			
		||||
                                   std::vector<opus_int16>& output, u64* out_performance_time) {
 | 
			
		||||
        const auto start_time = std::chrono::high_resolution_clock::now();
 | 
			
		||||
        std::size_t raw_output_sz = output.size() * sizeof(opus_int16);
 | 
			
		||||
        const std::size_t raw_output_sz = output.size() * sizeof(opus_int16);
 | 
			
		||||
        if (sizeof(OpusHeader) > input.size()) {
 | 
			
		||||
            LOG_ERROR(Audio, "Input is smaller than the header size, header_sz={}, input_sz={}",
 | 
			
		||||
                      sizeof(OpusHeader), input.size());
 | 
			
		||||
            return false;
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        OpusHeader hdr{};
 | 
			
		||||
        std::memcpy(&hdr, input.data(), sizeof(OpusHeader));
 | 
			
		||||
        if (sizeof(OpusHeader) + static_cast<u32>(hdr.sz) > input.size()) {
 | 
			
		||||
@@ -106,8 +126,9 @@ private:
 | 
			
		||||
                      sizeof(OpusHeader) + static_cast<u32>(hdr.sz), input.size());
 | 
			
		||||
            return false;
 | 
			
		||||
        }
 | 
			
		||||
        auto frame = input.data() + sizeof(OpusHeader);
 | 
			
		||||
        auto decoded_sample_count = opus_packet_get_nb_samples(
 | 
			
		||||
 | 
			
		||||
        const auto frame = input.data() + sizeof(OpusHeader);
 | 
			
		||||
        const auto decoded_sample_count = opus_packet_get_nb_samples(
 | 
			
		||||
            frame, static_cast<opus_int32>(input.size() - sizeof(OpusHeader)),
 | 
			
		||||
            static_cast<opus_int32>(sample_rate));
 | 
			
		||||
        if (decoded_sample_count * channel_count * sizeof(u16) > raw_output_sz) {
 | 
			
		||||
@@ -117,8 +138,9 @@ private:
 | 
			
		||||
                decoded_sample_count * channel_count * sizeof(u16), raw_output_sz);
 | 
			
		||||
            return false;
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        const int frame_size = (static_cast<int>(raw_output_sz / sizeof(s16) / channel_count));
 | 
			
		||||
        auto out_sample_count =
 | 
			
		||||
        const auto out_sample_count =
 | 
			
		||||
            opus_decode(decoder.get(), frame, hdr.sz, output.data(), frame_size, 0);
 | 
			
		||||
        if (out_sample_count < 0) {
 | 
			
		||||
            LOG_ERROR(Audio,
 | 
			
		||||
@@ -127,16 +149,24 @@ private:
 | 
			
		||||
                      out_sample_count, frame_size, static_cast<u32>(hdr.sz));
 | 
			
		||||
            return false;
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        const auto end_time = std::chrono::high_resolution_clock::now() - start_time;
 | 
			
		||||
        sample_count = out_sample_count;
 | 
			
		||||
        consumed = static_cast<u32>(sizeof(OpusHeader) + hdr.sz);
 | 
			
		||||
        if (performance_time.has_value()) {
 | 
			
		||||
            performance_time->get() =
 | 
			
		||||
        if (out_performance_time != nullptr) {
 | 
			
		||||
            *out_performance_time =
 | 
			
		||||
                std::chrono::duration_cast<std::chrono::milliseconds>(end_time).count();
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        return true;
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    void ResetDecoderContext() {
 | 
			
		||||
        ASSERT(decoder != nullptr);
 | 
			
		||||
 | 
			
		||||
        opus_decoder_ctl(decoder.get(), OPUS_RESET_STATE);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    struct OpusHeader {
 | 
			
		||||
        u32_be sz; // Needs to be BE for some odd reason
 | 
			
		||||
        INSERT_PADDING_WORDS(1);
 | 
			
		||||
@@ -157,6 +187,7 @@ void HwOpus::GetWorkBufferSize(Kernel::HLERequestContext& ctx) {
 | 
			
		||||
    IPC::RequestParser rp{ctx};
 | 
			
		||||
    const auto sample_rate = rp.Pop<u32>();
 | 
			
		||||
    const auto channel_count = rp.Pop<u32>();
 | 
			
		||||
 | 
			
		||||
    LOG_DEBUG(Audio, "called with sample_rate={}, channel_count={}", sample_rate, channel_count);
 | 
			
		||||
 | 
			
		||||
    ASSERT_MSG(sample_rate == 48000 || sample_rate == 24000 || sample_rate == 16000 ||
 | 
			
		||||
@@ -174,9 +205,10 @@ void HwOpus::GetWorkBufferSize(Kernel::HLERequestContext& ctx) {
 | 
			
		||||
 | 
			
		||||
void HwOpus::OpenOpusDecoder(Kernel::HLERequestContext& ctx) {
 | 
			
		||||
    IPC::RequestParser rp{ctx};
 | 
			
		||||
    auto sample_rate = rp.Pop<u32>();
 | 
			
		||||
    auto channel_count = rp.Pop<u32>();
 | 
			
		||||
    auto buffer_sz = rp.Pop<u32>();
 | 
			
		||||
    const auto sample_rate = rp.Pop<u32>();
 | 
			
		||||
    const auto channel_count = rp.Pop<u32>();
 | 
			
		||||
    const auto buffer_sz = rp.Pop<u32>();
 | 
			
		||||
 | 
			
		||||
    LOG_DEBUG(Audio, "called sample_rate={}, channel_count={}, buffer_size={}", sample_rate,
 | 
			
		||||
              channel_count, buffer_sz);
 | 
			
		||||
 | 
			
		||||
@@ -185,8 +217,9 @@ void HwOpus::OpenOpusDecoder(Kernel::HLERequestContext& ctx) {
 | 
			
		||||
               "Invalid sample rate");
 | 
			
		||||
    ASSERT_MSG(channel_count == 1 || channel_count == 2, "Invalid channel count");
 | 
			
		||||
 | 
			
		||||
    std::size_t worker_sz = WorkerBufferSize(channel_count);
 | 
			
		||||
    const std::size_t worker_sz = WorkerBufferSize(channel_count);
 | 
			
		||||
    ASSERT_MSG(buffer_sz >= worker_sz, "Worker buffer too large");
 | 
			
		||||
 | 
			
		||||
    std::unique_ptr<OpusDecoder, OpusDeleter> decoder{
 | 
			
		||||
        static_cast<OpusDecoder*>(operator new(worker_sz))};
 | 
			
		||||
    if (const int err = opus_decoder_init(decoder.get(), sample_rate, channel_count)) {
 | 
			
		||||
 
 | 
			
		||||
		Reference in New Issue
	
	Block a user