
ios - Real-time audio processing with no output


I'm looking at this example: http://teragonaudio.com/article/How-to-do-realtime-recording-with-effect-processing-on-iOS.html

I want to turn off the output. I tried changing kAudioSessionCategory_PlayAndRecord to kAudioSessionCategory_RecordAudio, but that didn't work. I also tried getting rid of:

if(AudioUnitSetProperty(*audioUnit, kAudioUnitProperty_StreamFormat,
                        kAudioUnitScope_Output, 1, &streamDescription,
                        sizeof(streamDescription)) != noErr) {
    return 1;
}

because I want to capture sound from the microphone without playing it back. But no matter what I do, I get a -50 error by the time my audio reaches the renderCallback method. When the audio is automatically played back on the output, everything works fine...

Updated code:

using namespace std;

AudioUnit *audioUnit = NULL;
float *convertedSampleBuffer = NULL;

int initAudioSession() {
    audioUnit = (AudioUnit*)malloc(sizeof(AudioUnit));

    if(AudioSessionInitialize(NULL, NULL, NULL, NULL) != noErr) {
        return 1;
    }

    if(AudioSessionSetActive(true) != noErr) {
        return 1;
    }

    UInt32 sessionCategory = kAudioSessionCategory_PlayAndRecord;
    if(AudioSessionSetProperty(kAudioSessionProperty_AudioCategory,
                               sizeof(UInt32), &sessionCategory) != noErr) {
        return 1;
    }

    // Request a preferred hardware I/O buffer duration of ~20 ms
    Float32 bufferSizeInSec = 0.02f;
    if(AudioSessionSetProperty(kAudioSessionProperty_PreferredHardwareIOBufferDuration,
                               sizeof(Float32), &bufferSizeInSec) != noErr) {
        return 1;
    }

    // Route playback to the speaker instead of the receiver
    UInt32 overrideCategory = 1;
    if(AudioSessionSetProperty(kAudioSessionProperty_OverrideCategoryDefaultToSpeaker,
                               sizeof(UInt32), &overrideCategory) != noErr) {
        return 1;
    }

    // There are many properties you might want to provide callback functions for:
    // kAudioSessionProperty_AudioRouteChange
    // kAudioSessionProperty_OverrideCategoryEnableBluetoothInput
    // etc.

    return 0;
}

OSStatus renderCallback(void *userData, AudioUnitRenderActionFlags *actionFlags,
                        const AudioTimeStamp *audioTimeStamp, UInt32 busNumber,
                        UInt32 numFrames, AudioBufferList *buffers) {
    OSStatus status = AudioUnitRender(*audioUnit, actionFlags, audioTimeStamp,
                                      1, numFrames, buffers);

    int doOutput = 0;

    if(status != noErr) {
        return status;
    }

    if(convertedSampleBuffer == NULL) {
        // Lazy initialization of this buffer is necessary because we don't
        // know the frame count until the first callback
        convertedSampleBuffer = (float*)malloc(sizeof(float) * numFrames);
        baseTime = (float)QRealTimer::getUptimeInMilliseconds();
    }

    SInt16 *inputFrames = (SInt16*)(buffers->mBuffers->mData);

    // If your DSP code can use integers, then don't bother converting to
    // floats here, as it just wastes CPU. However, most DSP algorithms rely
    // on floating point, and this is especially true if you are porting a
    // VST/AU to iOS.

    // (x_inbuf, x_phase, fftlength, x_alignment, and x_netscore belong to the
    // asker's alignment code and are defined elsewhere.)

    int i;

    // Shift the analysis buffer left to make room for the new frames
    for(i = numFrames; i < fftlength; i++) {
        x_inbuf[i - numFrames] = x_inbuf[i];
    }

    // Convert the incoming 16-bit samples to floats in [-1, 1)
    for(i = 0; i < numFrames; i++) {
        x_inbuf[i + x_phase] = (float)inputFrames[i] / (float)32768;
    }

    if(x_phase + numFrames == fftlength) {
        x_alignment.SigProc_frontend(x_inbuf); // Signal processing front-end (FFT!)
        doOutput = x_alignment.Align();

        // Output as text! In the real-time version, this is where we update
        // visualisation callbacks and launch other services
        if(doOutput && x_netscore.isEvent(x_alignment.Position())
           && (x_alignment.lastAction() < x_alignment.Position())) {
            // here I want to do something with my input!
        }
    } else {
        x_phase += numFrames;
    }

    return noErr;
}
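An aside, not in the original code: with a render callback on a RemoteIO unit, whatever is left in buffers when the callback returns is sent to the speaker. A minimal sketch of muting the output while keeping the callback, assuming the variable names above:

// Sketch (assumption, not in the original question): zero the output
// buffers and flag the render as silent so nothing audible is played.
for(UInt32 b = 0; b < buffers->mNumberBuffers; b++) {
    memset(buffers->mBuffers[b].mData, 0, buffers->mBuffers[b].mDataByteSize);
}
*actionFlags |= kAudioUnitRenderAction_OutputIsSilence;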


int initAudioStreams(AudioUnit *audioUnit) {
    UInt32 audioCategory = kAudioSessionCategory_PlayAndRecord;
    if(AudioSessionSetProperty(kAudioSessionProperty_AudioCategory,
                               sizeof(UInt32), &audioCategory) != noErr) {
        return 1;
    }

    UInt32 overrideCategory = 1;
    if(AudioSessionSetProperty(kAudioSessionProperty_OverrideCategoryDefaultToSpeaker,
                               sizeof(UInt32), &overrideCategory) != noErr) {
        // Less serious error, but you may want to handle it and bail here
    }

    AudioComponentDescription componentDescription;
    componentDescription.componentType = kAudioUnitType_Output;
    componentDescription.componentSubType = kAudioUnitSubType_RemoteIO;
    componentDescription.componentManufacturer = kAudioUnitManufacturer_Apple;
    componentDescription.componentFlags = 0;
    componentDescription.componentFlagsMask = 0;
    AudioComponent component = AudioComponentFindNext(NULL, &componentDescription);
    if(AudioComponentInstanceNew(component, audioUnit) != noErr) {
        return 1;
    }

    // Enable recording on the input bus (bus 1) of the RemoteIO unit
    UInt32 enable = 1;
    if(AudioUnitSetProperty(*audioUnit, kAudioOutputUnitProperty_EnableIO,
                            kAudioUnitScope_Input, 1, &enable, sizeof(UInt32)) != noErr) {
        return 1;
    }

    AURenderCallbackStruct callbackStruct;
    callbackStruct.inputProc = renderCallback; // Render function
    callbackStruct.inputProcRefCon = NULL;
    if(AudioUnitSetProperty(*audioUnit, kAudioUnitProperty_SetRenderCallback,
                            kAudioUnitScope_Input, 0, &callbackStruct,
                            sizeof(AURenderCallbackStruct)) != noErr) {
        return 1;
    }

    AudioStreamBasicDescription streamDescription;
    // You might want to replace this with a different value, but keep in mind that the
    // iPhone does not support all sample rates. 8kHz, 22kHz, and 44.1kHz should all work.
    streamDescription.mSampleRate = 44100;
    // Yes, I know you probably want floating point samples, but the iPhone isn't going
    // to give you floating point data. You'll need to make the conversion by hand from
    // linear PCM <-> float.
    streamDescription.mFormatID = kAudioFormatLinearPCM;
    // This part is important!
    streamDescription.mFormatFlags = kAudioFormatFlagIsSignedInteger |
                                     kAudioFormatFlagsNativeEndian |
                                     kAudioFormatFlagIsPacked;
    streamDescription.mBitsPerChannel = 16;
    // 1 sample per frame; each frame will always be 2 bytes as long as 16-bit
    // samples are being used
    streamDescription.mBytesPerFrame = 2;
    streamDescription.mChannelsPerFrame = 1;
    streamDescription.mBytesPerPacket = streamDescription.mBytesPerFrame *
                                        streamDescription.mChannelsPerFrame;
    // Always should be set to 1
    streamDescription.mFramesPerPacket = 1;
    // Always set to 0, just to be sure
    streamDescription.mReserved = 0;

    // Set up input stream with above properties
    if(AudioUnitSetProperty(*audioUnit, kAudioUnitProperty_StreamFormat,
                            kAudioUnitScope_Input, 0, &streamDescription,
                            sizeof(streamDescription)) != noErr) {
        return 1;
    }

    // Ditto for the output stream, which we will be sending the processed audio to
    if(AudioUnitSetProperty(*audioUnit, kAudioUnitProperty_StreamFormat,
                            kAudioUnitScope_Output, 1, &streamDescription,
                            sizeof(streamDescription)) != noErr) {
        return 1;
    }

    return 0;
}


int startAudioUnit(AudioUnit *audioUnit) {
    if(AudioUnitInitialize(*audioUnit) != noErr) {
        return 1;
    }

    if(AudioOutputUnitStart(*audioUnit) != noErr) {
        return 1;
    }

    return 0;
}

And then I call, from my view controller:

initAudioSession();
initAudioStreams(audioUnit);
startAudioUnit(audioUnit);
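For completeness, a sketch of the matching teardown (assumed; the original question does not show one), mirroring the setup calls above:

// Sketch of the matching teardown, assuming the same global audioUnit pointer.
AudioOutputUnitStop(*audioUnit);           // stop the I/O callbacks
AudioUnitUninitialize(*audioUnit);         // undo AudioUnitInitialize
AudioComponentInstanceDispose(*audioUnit); // release the RemoteIO instance
free(audioUnit);
audioUnit = NULL;
AudioSessionSetActive(false);              // deactivate the audio session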

Best answer

If you only want to record, not play back, simply comment out the lines that set up the renderCallback:

AURenderCallbackStruct callbackStruct;
callbackStruct.inputProc = renderCallback; // Render function
callbackStruct.inputProcRefCon = NULL;
if(AudioUnitSetProperty(*audioUnit, kAudioUnitProperty_SetRenderCallback,
                        kAudioUnitScope_Input, 0, &callbackStruct,
                        sizeof(AURenderCallbackStruct)) != noErr) {
    return 1;
}
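A related sketch, not from the original answer: the RemoteIO unit can also be told explicitly not to produce output at all, via kAudioOutputUnitProperty_EnableIO on the output scope of bus 0 (input on bus 1 stays enabled as in the question's code):

// Sketch (assumption): disable the output side of the RemoteIO unit so it
// only records; this must be set before AudioUnitInitialize is called.
UInt32 disableOutput = 0;
if(AudioUnitSetProperty(*audioUnit, kAudioOutputUnitProperty_EnableIO,
                        kAudioUnitScope_Output, 0, &disableOutput,
                        sizeof(UInt32)) != noErr) {
    return 1;
}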

Update after seeing the code:

As I suspected, you're missing an input callback. (The -50 you're seeing is kAudio_ParamError; AudioUnitRender typically returns it when it's handed an invalid parameter, such as being asked to pull from a bus that has nothing to supply.) Add these lines:

// at top:
#define kInputBus 1

AURenderCallbackStruct callbackStruct;
callbackStruct.inputProc = &ALAudioUnit::recordingCallback;
callbackStruct.inputProcRefCon = this;
status = AudioUnitSetProperty(audioUnit,
                              kAudioOutputUnitProperty_SetInputCallback,
                              kAudioUnitScope_Global,
                              kInputBus,
                              &callbackStruct,
                              sizeof(callbackStruct));

Now, in your recordingCallback:

OSStatus ALAudioUnit::recordingCallback(void *inRefCon,
                                        AudioUnitRenderActionFlags *ioActionFlags,
                                        const AudioTimeStamp *inTimeStamp,
                                        UInt32 inBusNumber,
                                        UInt32 inNumberFrames,
                                        AudioBufferList *ioData)
{
    // TODO: Use inRefCon to access our interface object to do stuff
    // Then, use inNumberFrames to figure out how much data is available, and make
    // that much space available in buffers in an AudioBufferList.

    // Then:
    // Obtain recorded samples

    OSStatus status;

    ALAudioUnit *pThis = reinterpret_cast<ALAudioUnit*>(inRefCon);
    if (!pThis)
        return noErr;

    //assert (pThis->m_nMaxSliceFrames >= inNumberFrames);

    pThis->recorderBufferList->GetBufferList().mBuffers[0].mDataByteSize =
        inNumberFrames * pThis->m_recorderSBD.mBytesPerFrame;

    status = AudioUnitRender(pThis->audioUnit,
                             ioActionFlags,
                             inTimeStamp,
                             inBusNumber,
                             inNumberFrames,
                             &pThis->recorderBufferList->GetBufferList());
    THROW_EXCEPTION_IF_ERROR(status, "error rendering audio unit");

    // If we're not playing, I don't care about the data, simply discard it
    if (!pThis->playbackState || pThis->isSeeking) return noErr;

    // Now, we have the samples we just read sitting in buffers in bufferList
    pThis->DoStuffWithTheRecordedAudio(inNumberFrames, pThis->recorderBufferList, inTimeStamp);

    return noErr;
}
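For illustration, a hypothetical body for DoStuffWithTheRecordedAudio (the method name comes from the answer above; this implementation is assumed), reusing the 16-bit-to-float normalization from the question:

// Hypothetical sketch: assumes mono 16-bit linear PCM as configured above.
void ALAudioUnit::DoStuffWithTheRecordedAudio(UInt32 inNumberFrames,
                                              AUBufferList *bufferList,
                                              const AudioTimeStamp *inTimeStamp)
{
    SInt16 *samples = (SInt16*)bufferList->GetBufferList().mBuffers[0].mData;
    for(UInt32 i = 0; i < inNumberFrames; i++) {
        float sample = (float)samples[i] / 32768.0f; // normalize to [-1, 1)
        // ... feed `sample` into the FFT front-end / alignment code here
    }
}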

By the way, I'm allocating my own buffer rather than using the one provided by the AudioUnit. You may want to change those parts if you'd rather use the AudioUnit-allocated buffer.

Update:

How to allocate your own buffer:

recorderBufferList = new AUBufferList();
recorderBufferList->Allocate(m_recorderSBD, m_nMaxSliceFrames);
recorderBufferList->PrepareBuffer(m_recorderSBD, m_nMaxSliceFrames);

Also, if you do this, tell the AudioUnit not to allocate buffers:

// Disable buffer allocation for the recorder (optional - do this if we want
// to pass in our own)
flag = 0;
status = AudioUnitSetProperty(audioUnit,
                              kAudioUnitProperty_ShouldAllocateBuffer,
                              kAudioUnitScope_Input,
                              kInputBus,
                              &flag,
                              sizeof(flag));

You'll need to include the CoreAudio utility classes.
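A minimal sketch of the include, assuming Apple's "Core Audio Utility Classes" sample code (the PublicUtility folder) has been added to the project; AUBufferList is declared there:

// Assumes Apple's Core Audio Utility Classes (PublicUtility) are in the
// project; AUBuffer.h declares AUBufferList.
#include "AUBuffer.h"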

Original question on Stack Overflow: https://stackoverflow.com/questions/15551439/
