Android Opensles 使用 FFmpeg 重采样 PCM-6ren

Android Opensles 使用 FFmpeg 重采样 PCM

转载作者：太空狗更新时间：2023-10-29 15:08:43

我正在尝试在 Android 上使用 FFmpeg 和 OpenSL ES 播放音频流。问题似乎出在把 FFmpeg 解码并重采样后的帧传递给 OpenSL ES 的环节，因为播放出来的声音听起来很机械（像机器人的声音），并且带有刺耳的杂音。

来自 ffmpeg 的解码帧:

PCM
48000 Hz
S16p

Opensles 在这种情况下需要:

PCM
48000 Hz
S16

Opensles 设置:

// Data locator: an Android simple buffer queue.
SLDataLocator_AndroidSimpleBufferQueue loc_bufq = {
    SL_DATALOCATOR_ANDROIDSIMPLEBUFFERQUEUE, // locator type
    255                                      // number of buffers the queue can hold
};

// PCM format fed to the player: 2 channels, 48 kHz, 16-bit little-endian.
SLDataFormat_PCM format_pcm = {
    SL_DATAFORMAT_PCM,                              // format type
    2,                                              // channel count
    SL_SAMPLINGRATE_48,                             // sampling rate
    SL_PCMSAMPLEFORMAT_FIXED_16,                    // bits per sample
    SL_PCMSAMPLEFORMAT_FIXED_16,                    // container size
    SL_SPEAKER_FRONT_LEFT | SL_SPEAKER_FRONT_RIGHT, // channel mask
    SL_BYTEORDER_LITTLEENDIAN                       // byte order
};

// Audio source = where the data comes from (locator) + what it looks like (format).
SLDataSource audioSrc = {
    &loc_bufq,
    &format_pcm
};

这是重新采样和入队到 opensles 的伪代码:

/* Number of MAX_AUDIO_FRAME_SIZE-sized frames that audio_buffer has room for. */
#define OPENSLES_BUFLEN 10
/* Number of bytes reserved per frame inside audio_buffer. */
#define MAX_AUDIO_FRAME_SIZE 192000

/* Byte array of MAX_AUDIO_FRAME_SIZE * OPENSLES_BUFLEN bytes, declared through
 * DECLARE_ALIGNED with an alignment argument of 16. decode_audio() uses it as
 * the swr_convert() output and passes it to the buffer queue's Enqueue(). */
DECLARE_ALIGNED(16,uint8_t,audio_buffer)[MAX_AUDIO_FRAME_SIZE * OPENSLES_BUFLEN];


/**
 * Decodes one audio packet, converts the decoded frame to interleaved stereo
 * S16 and enqueues the result on the OpenSL ES buffer queue.
 *
 * OpenSL ES plays queued buffers in place: Enqueue() stores the pointer, it
 * does not copy the samples. Writing the next frame to the same address while
 * an earlier one is still queued corrupts the audio being played (typically
 * heard as robotic / scratchy sound). To avoid that, audio_buffer is used as
 * OPENSLES_BUFLEN slots of MAX_AUDIO_FRAME_SIZE bytes each and every
 * successful Enqueue() advances to the next slot.
 *
 * NOTE(review): this only protects the last OPENSLES_BUFLEN frames. The caller
 * must not keep more than OPENSLES_BUFLEN buffers in flight, e.g. by pacing
 * enqueues from the buffer-queue callback or by creating the queue with
 * numBuffers <= OPENSLES_BUFLEN (the locator shown with this snippet uses 255).
 * The slot counter is a plain static, so the function is assumed to be called
 * from a single decoding thread.
 *
 * @param ctx          opened decoder context the packet belongs to
 * @param swr_context  resampler producing stereo S16, or NULL when the decoder
 *                     already outputs packed data that can be played as is
 * @param packet       compressed packet to decode
 * @param frame        scratch frame that receives the decoded samples
 * @return number of bytes of the packet consumed by the decoder (>= 0) on
 *         success, -ERROR when decoding, conversion or enqueueing fails or
 *         when no frame was produced
 */
int decode_audio(AVCodecContext * ctx, SwrContext *swr_context, AVPacket *packet, AVFrame * frame){
    /* Index of the audio_buffer slot that receives the next frame. */
    static int next_slot = 0;

    int got_frame_ptr = 0;
    int len = avcodec_decode_audio4(ctx, frame, &got_frame_ptr, packet);

    if (len < 0 || !got_frame_ptr)
        return -ERROR;

    uint8_t *audio_buf = audio_buffer + (size_t)next_slot * MAX_AUDIO_FRAME_SIZE;
    int data_size;

    if (swr_context != NULL) {
        uint8_t *out[] = { audio_buf };

        /* Bytes per interleaved output frame: 2 channels of S16. */
        int bytes_per_out_frame = 2 * av_get_bytes_per_sample(AV_SAMPLE_FMT_S16);
        /* swr_convert() takes the output capacity in samples per channel. */
        int out_capacity = MAX_AUDIO_FRAME_SIZE / bytes_per_out_frame;

        int len2 = swr_convert(swr_context, out, out_capacity,
            (const uint8_t **)frame->extended_data, frame->nb_samples);

        if (len2 < 0) {
            return -ERROR;
        }
        if (len2 == out_capacity) {
            /* The slot was filled completely, so the slot is probably too
             * small for this frame; re-initialise the resampler as the
             * original code did. */
            swr_init(swr_context);
        }
        data_size = len2 * bytes_per_out_frame;
    }
    else {
        int i;
        int original_data_size = av_samples_get_buffer_size(NULL, ctx->channels,
            frame->nb_samples, ctx->sample_fmt, 1);

        /* Planar data keeps every channel in its own plane, so data[0] alone
         * is not a playable interleaved stream; it needs the resampler. */
        if (av_sample_fmt_is_planar(ctx->sample_fmt)
                || original_data_size < 0
                || original_data_size > MAX_AUDIO_FRAME_SIZE) {
            return -ERROR;
        }

        /* Copy out of the frame: the decoder reuses the frame's storage on
         * the next call, while the queue may still be playing this data. */
        for (i = 0; i < original_data_size; i++) {
            audio_buf[i] = frame->data[0][i];
        }
        data_size = original_data_size;
    }

    /* The resampler may buffer a whole frame and output nothing; there is
     * nothing to enqueue in that case. */
    if (data_size > 0) {
        if ((*opengSLESData->bqPlayerBufferQueue)->Enqueue(opengSLESData->bqPlayerBufferQueue,
                audio_buf, data_size) != SL_RESULT_SUCCESS) {
            return -ERROR;
        }
        next_slot = (next_slot + 1) % OPENSLES_BUFLEN;
    }

    return len;
}

如果有任何帮助，我将不胜感激。

最佳答案

下面这个例子可能会有所帮助：它用 FFmpeg 解码输入文件，通过 libswresample 把音频转换为单声道、8000 Hz、S16 的 PCM，并写入输出文件。

#include "stdafx.h"
#include <iostream>

extern "C"
{
#include "libavcodec/avcodec.h"
#include "libavformat/avformat.h"
//#include "swscale.h"
#include "libswresample/swresample.h"
};

// File handles kept at file scope. ffmpeg_audio_decode() opens and closes
// `fout`; `fin` is not referenced by the code shown here.
FILE* fin;
FILE* fout;

int ffmpeg_audio_decode( const char * inFile, const char * outFile)
{
// Initialize FFmpeg
av_register_all();

AVFrame* frame = avcodec_alloc_frame();
if (!frame)
{
    std::cout << "Error allocating the frame" << std::endl;
    return 1;
}

// you can change the file name "01 Push Me to the Floor.wav" to whatever the file is you're reading, like "myFile.ogg" or
// "someFile.webm" and this should still work
AVFormatContext* formatContext = NULL;
//if (avformat_open_input(&formatContext, "01 Push Me to the Floor.wav", NULL, NULL) != 0)
if (avformat_open_input(&formatContext, inFile, NULL, NULL) != 0)
{
    av_free(frame);
    std::cout << "Error opening the file" << std::endl;
    return 1;
}

if (avformat_find_stream_info(formatContext, NULL) < 0)
{
    av_free(frame);
    av_close_input_file(formatContext);
    std::cout << "Error finding the stream info" << std::endl;
    return 1;
}

AVStream* audioStream = NULL;
// Find the audio stream (some container files can have multiple streams in them)
for (unsigned int i = 0; i < formatContext->nb_streams; ++i)
{
    if (formatContext->streams[i]->codec->codec_type == AVMEDIA_TYPE_AUDIO)
    {
        audioStream = formatContext->streams[i];
        break;
    }
}

if (audioStream == NULL)
{
    av_free(frame);
    av_close_input_file(formatContext);
    std::cout << "Could not find any audio stream in the file" << std::endl;
    return 1;
}

AVCodecContext* codecContext = audioStream->codec;

codecContext->codec = avcodec_find_decoder(codecContext->codec_id);
if (codecContext->codec == NULL)
{
    av_free(frame);
    av_close_input_file(formatContext);
    std::cout << "Couldn't find a proper decoder" << std::endl;
    return 1;
}
else if (avcodec_open2(codecContext, codecContext->codec, NULL) != 0)
{
    av_free(frame);
    av_close_input_file(formatContext);
    std::cout << "Couldn't open the context with the decoder" << std::endl;
    return 1;
}

std::cout << "This stream has " << codecContext->channels << " channels and a sample rate of " << codecContext->sample_rate << "Hz" << std::endl;
std::cout << "The data is in the format " << av_get_sample_fmt_name(codecContext->sample_fmt) << std::endl;

//codecContext->sample_fmt = AV_SAMPLE_FMT_S16;

int64_t outChannelLayout = AV_CH_LAYOUT_MONO; //AV_CH_LAYOUT_STEREO;
AVSampleFormat outSampleFormat = AV_SAMPLE_FMT_S16; // Packed audio, non-planar (this is the most common format, and probably what you want; also, WAV needs it)
int outSampleRate = 8000;//44100;
// Note that AVCodecContext::channel_layout may or may not be set by libavcodec. Because of this,
// we won't use it, and will instead try to guess the layout from the number of channels.
SwrContext* swrContext = swr_alloc_set_opts(NULL,
    outChannelLayout,
    outSampleFormat,
    outSampleRate,
    av_get_default_channel_layout(codecContext->channels),
    codecContext->sample_fmt,
    codecContext->sample_rate,
    0,
    NULL);

if (swrContext == NULL)
{
    av_free(frame);
    avcodec_close(codecContext);
    avformat_close_input(&formatContext);
    std::cout << "Couldn't create the SwrContext" << std::endl;
    return 1;
}

if (swr_init(swrContext) != 0)
{
    av_free(frame);
    avcodec_close(codecContext);
    avformat_close_input(&formatContext);
    swr_free(&swrContext);
    std::cout << "Couldn't initialize the SwrContext" << std::endl;
    return 1;
}

fout = fopen(outFile, "wb+");

AVPacket packet;
av_init_packet(&packet);

// Read the packets in a loop
while (av_read_frame(formatContext, &packet) == 0)
{
    if (packet.stream_index == audioStream->index)
    {
        AVPacket decodingPacket = packet;

        while (decodingPacket.size > 0)
        {
            // Try to decode the packet into a frame
            int frameFinished = 0;
            int result = avcodec_decode_audio4(
                codecContext, 
                frame, 
                &frameFinished, 
                &decodingPacket);

            if (result < 0 || frameFinished == 0)
            {
                break;
            }

            unsigned char buffer[100000] = {NULL};
            unsigned char* pointers[SWR_CH_MAX] = {NULL};
            pointers[0] = &buffer[0];

            int numSamplesOut = swr_convert(
                swrContext,
                pointers,
                outSampleRate,
                (const unsigned char**)frame->extended_data,
                frame->nb_samples);


            fwrite(  
                (short *)buffer, 
                sizeof(short), 
                (size_t)numSamplesOut, 
                fout);

            decodingPacket.size -= result;
            decodingPacket.data += result;
        }

    }

    // You *must* call av_free_packet() after each call to av_read_frame() or else you'll leak memory
    av_free_packet(&packet);
}

// Some codecs will cause frames to be buffered up in the decoding process. If the CODEC_CAP_DELAY flag
// is set, there can be buffered up frames that need to be flushed, so we'll do that
if (codecContext->codec->capabilities & CODEC_CAP_DELAY)
{
    av_init_packet(&packet);
    // Decode all the remaining frames in the buffer, until the end is reached
    int frameFinished = 0;
    while (avcodec_decode_audio4(codecContext, frame, &frameFinished, &packet) >= 0 && frameFinished)
    {
    }
}

// Clean up!
av_free(frame);
avcodec_close(codecContext);
av_close_input_file(formatContext);
fclose(fout);
}

关于Android Opensles 使用 FFmpeg 重采样 PCM，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/19066162/

文章推荐： c - Linux“apt-get更新”工作流程

文章推荐： jquery alt Accordion 不关闭

文章推荐： javascript - Phonegap 如何重用/包含 HTML 页面？

ffmpeg - ffmpeg 无法识别记录在案的 ffmpeg 命令
我正在尝试使用 ldash 等选项和 http_opts ，正如 dash muxer 文档所描述的，但 FFmpeg 无法识别它们。我正在使用最新发布的 ffmpeg v4.2.2 版本。我在 ff
ffmpeg - 是否有某种 ffmpeg 输出转换为 ffmpeg 命令行？
假设我们有许多想要与 -vcodec 副本(或等效语法)合并的视频记录。无需重新编码，不会损失质量。并且很少有记录(minor set)，有另外的编解码器，参数等等。所以我们可以使用 ffprobe
ffmpeg - 安装错误: No such file or directory: 'ffmpeg' : 'ffmpeg'
有没有办法安装 ffmpeg 没有root访问权限？使用 ./configure 无法做到这一点来自 git 克隆 git://source.FFmpeg.org/fFFmpeg.git 最佳答案是
ffmpeg - 直接使用 FFmpeg 与使用 Ffmpeg 命令行的应用程序有什么区别？
在应用程序中直接使用 FFmpeg 与使用 Ffmpeg 命令行有什么区别？最佳答案没有:FFmpeg 命令行只是一个使用 FFmpeg API 的应用程序。当然，在使用该应用程序时，您仅限于已实
ffmpeg - 有没有办法使用各种 ffmpeg 命令找出 ffmpeg 在我的系统中的性能是否最佳？
我正在使用以下命令对文件(下面的媒体信息)进行编码: ffmpeg -i AHomeMovie.mkv -map 0 -c copy -c:v libx264 -preset veryslow -cr
ffmpeg - 为 ffmpeg 视频添加边框 [ffmpeg-python]
我正在制作一张圣诞贺卡，我需要将视频嵌入到右侧(边框内)的卡片中，并在左侧显示一些文本。为简单起见，假设我有一个带有透明孔的盒子。我想在那个洞里显示视频。我正在使用 ffmpeg-python很高
Laravel FFmpeg 错误调用未定义的方法 FFMpeg\FFMpeg::fromDisk()
我正在使用 laravel ffmpeg 为视频创建缩略图，但是当我运行代码时，它返回给我 Call to undefined method FFMpeg\FFMpeg::fromDisk() 我不知
ffmpeg - ffmpeg 的硬件加速不起作用
我为我的 nvidia 下载了 cuda 驱动程序但它仍然不使用我的 GPU，它仍然使用 cpu。我怎样才能让它使用GPU。我也听说过硬件加速，但那不起作用。它必须是 h.264 最佳答案你
ffmpeg - 剪切多个部分后音频和视频不同步 - FFMPEG
尝试剪切视频的多个部分时，我遵循此问题的解决方案 Cut multiple parts of a video with ffmpeg .但问题是，如果我剪切多次(比如大约 20 次或更多)，视频和音频
ffmpeg - FFMPEG 的免许可编解码器有哪些？
所以我最近开始在我打算在商业上分发的应用程序中实现 ffmpeg。而且我很难理解整个许可过程。我见过的最常回答的问题似乎是关于 x264，它需要 x264.org 的付费许可才能在商业上使用它(对吗
ffmpeg - ffmpeg 代码中是否存在缩短视频时间的因素？
我使用 ffmpeg 更改视频文件的分辨率，转换到另一个位置后，视频持续 0 秒，但最初持续 2 分钟我的ffmepg代码: ffmpeg -i input.mp4 -filter:v scale=
ffmpeg - FFMPEG 不支持加载外部过滤器是否有特定原因？
如上: FFMPEG 不支持在没有第三部分库的情况下加载外部过滤器是否有特定原因？ (像弗莱0r) 我必须重新编译整个包来添加一个新的过滤器! 最佳答案只有开发人员可以肯定地回答，但我会冒安全风险和
ffmpeg - 使用新的编码器编译 FFmpeg
我收到了一个编码器，我需要用 FFMPEG 编译，我是新手，所以我不知道如何用 ffmpeg 添加/编译它。编码器是JSV，我的服务器是ubuntu 14.04。我已经开始阅读这篇 https://
ffmpeg - FFMPEG 的硬件要求
关闭。这个问题不符合Stack Overflow guidelines .它目前不接受答案。我们不允许在 Stack Overflow 上提出有关通用计算硬件和软件的问题。您可以编辑问题，使其成为
ffmpeg - 如何确定某些编解码器和格式之间的转码和重新混合是否可以用于特定版本的 ffmpeg？
我正在制作一个利用 ffmpeg 重新混合和转码视频文件的程序。我想使用 ffmpeg -codecs和 ffmpeg -formats (或通过 ffmpeg 可用的任何其他命令)来检查我可以在哪些
ffmpeg - 移动文本drawtext过滤器的速度 - FFMPEG
这个问题在这里已经有了答案: ffmpeg moving text drawtext (1 个回答) 3年前关闭。我正在使用此命令使用 ffmpeg 将文本从一个地方移动到另一个地方 ffmpeg
ffmpeg - ffmpeg/ffprobe中的持续时间比特率和流比特率有什么区别？
为什么 ffmpeg/ffprobe 为流和整个文件提供不同的比特率值？当我使用 ffprobe 分析 mp3 文件时，它会在第一行和第二行给出不同的比特率。有谁知道，有什么区别？ // File
ffmpeg - FFmpeg 中的多色文本
如何在ffmpeg中使用drawtext在视频上绘制多色文本？示例:我想突出句子中的专有名词， “XYZ公司股价上涨91%” 高亮 XYZ 白色黄色用绿色突出显示 91% 如果您有任何其他方法不
ffmpeg - 如何为您的不和谐机器人安装 FFMPEG？
我想让我的不和谐机器人播放音乐，但我不断收到“找不到 FFMPEG”错误。我的机器人主要是由 ping 制成的，所以我不会上传那部分。音乐代码应该是这个。 const Discord = requi
ffmpeg - ffmpeg drawtext过滤器中的德语变音符号
我需要帮助在 ffmpeg drawtext 过滤器中正确/(完全)显示德语变音符号“äüö”。我现在不能说我的无能是由于缺乏 ffmpeg 专业知识或机器配置，还是两者兼而有之。非常感谢您的意见。

太空狗

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

Android Opensles 使用 FFmpeg 重采样 PCM