c++ - Decoding an MKA audio file into raw data(MKA Audio to raw audio data)-6ren

c++ - Decoding an MKA audio file into raw data(MKA Audio to raw audio data)

转载作者：行者123 更新时间：2023-12-02 22:15:01

我的任务是打开一个扩展名为 mka 的现有音频文件(Matroska 容器)，并从中提取原始音频数据。这个示例仅演示了如何从 mp2 文件中提取原始数据，我不知道如何对 mka 容器执行同样的操作。我想要这样的东西:

UPD

我发现一个选项可以以音频文件中记录的格式保存音频数据。示例如下所示。

附言。这只是一个测试版本，很可能存在内存泄漏和其他问题。


#include <QFile>
#include <QDebug>
#include "audiodecoder.h"

int main(int argc, char* argv[])
{
    AudioDecoder decoder("/home/test/test.mka");
    bool started = decoder.start();
    if (!started) {
        return EXIT_FAILURE;
    }

    QFile file("/home/test/rawData.bin");
    file.open(QIODevice::WriteOnly);

    while (true) {
        auto data = decoder.getData(255);
        if (data.isEmpty()) {
            break;
        }
        file.write(data.data(), data.size());
    }
    file.close();
    return EXIT_SUCCESS;
}

audiodecoder.h

/**
 * Opens a single-stream audio file through FFmpeg and hands out decoded
 * frame data as QByteArray chunks.
 *
 * Typical use: construct with a file name, call start(), call getData()
 * repeatedly until it returns an empty array, then call stop() (the
 * destructor calls stop() as well).
 */
class AudioDecoder {
public:
    /// Stores the file name; the file itself is opened by start().
    AudioDecoder(const QString& fileName);
    virtual ~AudioDecoder();

    // The object holds raw FFmpeg pointers, so copying and moving are disabled.
    AudioDecoder(const AudioDecoder& rhs) = delete;
    AudioDecoder(AudioDecoder&& rhs) = delete;
    AudioDecoder& operator=(const AudioDecoder& rhs) = delete;
    AudioDecoder& operator=(AudioDecoder&& rhs) = delete;

    /// Opens the input and its decoder; returns true on success.
    virtual bool start() noexcept;
    /// Returns decoded data; an empty array means nothing could be delivered.
    /// The `size` argument is currently not honoured by the implementation.
    virtual QByteArray getData(const quint16& size) noexcept;
    /// Releases the codec and format contexts; always returns true.
    virtual bool stop() noexcept;

protected:
    bool m_initialized;  ///< Set to true once start() has succeeded.
    QString m_fileName;  ///< Path of the input file passed to the constructor.

    AVFrame* p_frame{nullptr};           ///< Frame that receives decoder output.
    AVPacket* p_packet{nullptr};         ///< Packet that receives demuxer output.
    AVCodecContext* p_cdcCtx{nullptr};   ///< Decoder context for the audio stream.
    AVFormatContext* p_frmCtx{nullptr};  ///< Demuxer context for the input file.
};

audiodecoder.cpp


/// Forwards `message` to Qt's debug output stream (qDebug()).
/// File-local helper used for the decoder's diagnostic messages.
static void logging(const char* message)
{
    qDebug() << message;
}

/**
 * Remembers the input file name and leaves the decoder un-started; no file is
 * opened here.
 *
 * @param fileName path of the audio file that start() will open.
 */
AudioDecoder::AudioDecoder(const QString& fileName)
    : m_initialized(false)
    , m_fileName(fileName)
    , p_cdcCtx(nullptr)
    , p_frmCtx(nullptr)
{
    // av_register_all() was deprecated in libavformat 58 (FFmpeg 4.0), where
    // registration became automatic, and was removed in libavformat 59
    // (FFmpeg 5.0). Only call it on older libraries. If the version macro is
    // not visible, keep the original behaviour and call it.
#if !defined(LIBAVFORMAT_VERSION_MAJOR) || LIBAVFORMAT_VERSION_MAJOR < 58
    av_register_all();
#endif
}

/**
 * Reads packets from the input and returns the decoded bytes of the next
 * frame(s).
 *
 * Packets are read and decoded until at least one frame has been produced, so
 * an empty result means "end of stream or error", never "this packet produced
 * no frame yet". When the input is exhausted the decoder is drained so that
 * buffered frames are not lost.
 *
 * @param dataSize requested number of bytes. NOT honoured: the returned array
 *                 holds whole decoded frames, whatever their size.
 * @return bytes copied from plane 0 of each decoded frame, or an empty array
 *         at end of stream, on a decoding error, or when the decoder has not
 *         been started.
 *
 * NOTE(review): linesize[0] bytes of data[0] are copied, as in the original
 * code. For audio this may include alignment padding, and for planar sample
 * formats it covers only the first channel -- confirm against the sample
 * format actually produced by the decoder.
 */
QByteArray AudioDecoder::getData(const quint16& dataSize) noexcept
{
    static_cast<void>(dataSize);

    // Calling this before start() or after stop() would dereference null
    // FFmpeg contexts.
    if (!p_frmCtx || !p_cdcCtx || !p_packet || !p_frame) {
        return {};
    }

    QByteArray data;

    // Appends every frame the decoder currently has ready to `data`.
    // Returns false only on a genuine decoding error.
    const auto receiveFrames = [this, &data]() -> bool {
        for (;;) {
            const int response = avcodec_receive_frame(p_cdcCtx, p_frame);
            if (response == AVERROR(EAGAIN) || response == AVERROR_EOF) {
                return true; // decoder needs more input, or is fully drained
            }
            if (response < 0) {
                logging("Error while receiving a frame from the decoder");
                return false;
            }
            logging(QString("Frame %1 (type=%2, size=%3 bytes) pts %4 key_frame %5 [DTS %6], duration[%7]")
                        .arg(p_cdcCtx->frame_number)
                        .arg(av_get_picture_type_char(p_frame->pict_type))
                        .arg(p_frame->pkt_size)
                        .arg(p_frame->pts)
                        .arg(p_frame->key_frame)
                        .arg(p_frame->coded_picture_number)
                        .arg(p_frame->pkt_duration)
                        .toStdString()
                        .c_str());

            // A non-positive length must not reach QByteArray::append(),
            // which may treat a negative length as "use strlen".
            if (p_frame->linesize[0] > 0) {
                data.append(reinterpret_cast<const char*>(p_frame->data[0]),
                            p_frame->linesize[0]);
            }
        }
    };

    while (data.isEmpty()) {
        if (av_read_frame(p_frmCtx, p_packet) < 0) {
            // Input exhausted: a null packet switches the decoder into
            // draining mode. Once it is already drained this call fails with
            // AVERROR_EOF, which is expected, so its result is ignored.
            static_cast<void>(avcodec_send_packet(p_cdcCtx, nullptr));
            if (!receiveFrames()) {
                return {};
            }
            break;
        }

        const int response = avcodec_send_packet(p_cdcCtx, p_packet);
        // The decoder keeps its own reference to the packet data, so the
        // packet can be released right away -- also on the error path, where
        // the original code leaked it.
        av_packet_unref(p_packet);
        if (response < 0) {
            logging("Error while sending a packet to the decoder");
            return {};
        }
        if (!receiveFrames()) {
            return {};
        }
    }
    return data;
}

bool AudioDecoder::start(void) noexcept
{
    if (m_initialized) {
        return true;
    }

    int error;
    // Open the input file to read from it.
    if ((error = avformat_open_input(&p_frmCtx,
             m_fileName.toStdString().c_str(), nullptr, nullptr))
        < 0) {
        qDebug() << "Could not open input file: " << m_fileName;
        p_frmCtx = nullptr;
        return false;
    }
    // Get information on the input file (number of streams etc.).
    if ((error = avformat_find_stream_info(p_frmCtx, nullptr)) < 0) {
        avformat_close_input(&p_frmCtx);
        qDebug() << __LINE__;
        return false;
    }
    // Make sure that there is only one stream in the input file.
    if ((p_frmCtx)->nb_streams != 1) {
        avformat_close_input(&p_frmCtx);
        qDebug() << __LINE__;
        return false;
    }

    if (p_frmCtx->streams[0]->codecpar->codec_type != AVMEDIA_TYPE_AUDIO) {
        avformat_close_input(&p_frmCtx);
        qDebug() << __LINE__;
        return false;
    }

    // Find a decoder for the audio stream.
    AVCodec* input_codec = nullptr;
    if (!(input_codec = avcodec_find_decoder((p_frmCtx)->streams[0]->codecpar->codec_id))) {
        avformat_close_input(&p_frmCtx);
        qDebug() << __LINE__;
        return false;
    }
    // Allocate a new decoding context.
    AVCodecContext* avctx = avcodec_alloc_context3(input_codec);
    if (!avctx) {
        avformat_close_input(&p_frmCtx);
        qDebug() << __LINE__;
        return false;
    }
    // Initialize the stream parameters with demuxer information.
    error = avcodec_parameters_to_context(avctx, (p_frmCtx)->streams[0]->codecpar);
    if (error < 0) {
        avformat_close_input(&p_frmCtx);
        avcodec_free_context(&avctx);
        qDebug() << __LINE__;
        return false;
    }
    /* Open the decoder for the audio stream to use it later. */
    if ((error = avcodec_open2(avctx, input_codec, NULL)) < 0) {
        avcodec_free_context(&avctx);
        avformat_close_input(&p_frmCtx);
        qDebug() << __LINE__;
        return false;
    }
    /* Save the decoder context for easier access later. */
    p_cdcCtx = avctx;
    av_dump_format(p_frmCtx, 0, m_fileName.toStdString().c_str(), 0);

    p_frame = av_frame_alloc();
    if (!p_frame) {
        logging("failed to allocated memory for AVFrame");
        return false;
    }
    p_packet = av_packet_alloc();
    if (!p_packet) {
        logging("failed to allocated memory for AVPacket");
        return false;
    }
    return m_initialized = true;
}

bool AudioDecoder::stop(void) noexcept
{
    if (p_cdcCtx != nullptr) {
        avcodec_free_context(&p_cdcCtx);
    }
    if (p_frmCtx != nullptr) {
        avformat_close_input(&p_frmCtx);
    }
    return true;
}

/// Releases the decoder's resources by calling stop().
AudioDecoder::~AudioDecoder()
{
    // Inside a destructor a virtual call already resolves to this class's
    // own implementation; the qualified name just makes that explicit.
    AudioDecoder::stop();
}

但是这个例子的问题在于：我没有实现按请求的大小精确返回音频数据的功能。在我的实现中，getData 的大小参数只是被忽略了。

最佳答案

如果您想提取以音频文件中原有格式编码的音频数据，那么您应该看看这个例子。在该示例中，您需要将输出类型从 aac 更改为 alaw。压缩流将保存在 AVPacket::buf 中:

A reference to the reference-counted buffer where the packet data is stored.

我还建议查看 this文章。它会帮助你:)

关于c++ - Decoding an MKA audio file into raw data(MKA Audio to raw audio data)，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/64119093/

文章推荐： audio - 低功耗蓝牙中的语音功能选项

文章推荐： javascript - 将数组中的所有数字填充到随机 div 中

文章推荐： ios - 广告后，声音在游戏中消失

file - access to file to files tomcat的conf文件夹下的一个文件
我想知道是否可以访问放在 tomcat 的 conf 文件夹中的文件。通常我会在这个文件中放置多个 webapp 的配置，在 war 之外。我想使用类路径独立于文件系统。我过去使用过 lib 文件
PowerShell ForEach $file in $Files 中的每个 $file
我有一个 PowerShell 脚本，它获取文件列表并移动满足特定条件的文件。为什么即使对象为空，foreach 循环也会运行？我假设如果 $i 不存在，它就不会运行。但是如果 $filePath
java - File file = new File () 的路径错误
我已将 BasicAccountRule.drl 放置在我的 Web 应用程序中，位置为:C:/workspace/exim_design/src/main/resources/rules/drl/i
ruby - File.open ('file.txt' ) 与 File.open ('file.txt' ).readlines
我使用 File.open('file.txt').class 和 File.open('file.txt').readlines.class 以及前者进行了检查一个返回 File，后者返回 Arra
java - 即使 file.exists()、file.canRead()、file.canWrite()、file.canExecute() 都返回 true，file.delete() 也会返回 false
我正在尝试使用 FileOutputStream 删除文件，在其中写入内容后。这是我用来编写的代码: private void writeContent(File file, String fileC
python - FileNotFoundException :File file:/path/to/file/in. txt不存在或者运行Flink的用户没有足够的权限访问它
我正在尝试使用 flink 和 python 批处理 api 测试 Wordcount 经典示例。我的问题是，将数据源从 env.from_elements() 修改为 env.read_text()
c - 通过函数 : FILE* or FILE**? 的 FILE* 数组
我正在尝试制作一个可以同时处理多个不同文件的程序。我的想法是制作一个包含 20 个 FILE* 的数组，以便在我达到此限制时能够关闭其中一个并打开请求的新文件。为此，我想到了一个函数，它选择一个选项
linux - 狂欢 : Search Contents of File A in File B and Print lines of File A in File C
我有两个文件A和B文件A: 976464 792992 文件B TimeStamp,Record1,976464,8383,ABCD 我想搜索文件 A 和文件 B 中的每条记录并打印匹配的记录。打印的
java - 使用 Java 8 流将 Map 转换为 Map>
我有一些保存在 map 中的属性文件。示例: Map map = new HashMap<>(); map.put("1", "One"); map.put("2", "Two"); map.put(
file - Unix/庆典 : Reading A List of Files and Merge Them To A File
我正在尝试找出一个脚本文件，该文件接受一个包含文件列表的文件(每一行都是一个文件路径，即 path/to/file)并将它们合并到一个文件中。例如: list.text -- path/to/fil
c# - File.CreateText/File.AppendText 与 File.AppendAllText
为了使用 File.CreateText() 和 File.AppendText() 你必须: 通过调用这些方法之一打开流写消息关闭流处理流为了使用 File.AppendAllText()
Using rsync to rename files during copying with --files-from?(在复制过程中使用rsync重命名文件--files-from？)
使用rsync时，如何在使用--files-from参数复制时重命名文件？我有大约190，000个文件，在从源复制到目标时，每个文件都需要重命名。我计划将文件列表放在一个文本文件中传递给--files
java - "file:d:\\dir1\file.xml"和 "file:/d:\\dir1\file.xml"作为 FileSystemXmlApplicationContext 参数
我在非服务器应用程序中使用 Spring(只需从 Eclipse 中某个类的 main() 编译并运行它)。我的问题是作为 new FileSystemXmlApplicationContext 的
ksh - "test -a file"和 "test file -ef file"的区别
QNX (Neutrino 6.5.0) 使用 ksh 的开源实现作为其 shell 。许多提供的脚本，包括系统启动脚本，都使用诸如 if ! test /dev/slog -ef /dev/slog
PHP : Excel cannot open the file because the file format or file extension is not valid
当我尝试打开从我的应用程序下载的 xls 文件时，出现此错误: excel cannot open the file because the file format or file extension
c - "file pointer"、 "stream"、 "file descriptor"和... "file"之间的区别？
有一些相关的概念，即文件指针、流和文件描述符。我知道文件指针是指向数据类型 FILE 的指针(在例如 FILE.h 和 struct_FILE.h 中声明)。我知道文件描述符是 int ，例如成员
file - Groovy(文件IO): find all files and return all files - the Groovy way
好吧，这应该很容易... 我是groovy的新手，我希望实现以下逻辑: def testFiles = findAllTestFiles(); 到目前为止，我想出了下面的代码，该代码可以成功打印所有文
PowerShell:为什么 "Get-Content | Out-File -Append "会进入循环？
我理解为什么以下内容会截断文件的内容: Get-Content | Out-File 这是因为 Out-File 首先运行，它会在 Get-Content 有机会读取文件之前清空文件。但是当我尝
file - 类型错误 : invalid file: When trying to make a file name a variable
您好，我正在尝试将文件位置表示为变量，因为最终脚本将在另一台机器上运行。这是我尝试过的代码，然后是我得到的错误。在我看来，python 是如何添加“\”的，这就是导致问题的原因。如果是这种情况，我如何
bash - 一行文件的 "$(cat file)"、 "$(
我有一个只包含一行的输入文件: $ cat input foo bar 我想在我的脚本中使用这一行，据我所知有 3 种方法: line=$(cat input) line=$( input"...,

行者123

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

c++ - Decoding an MKA audio file into raw data(MKA Audio to raw audio data)