android - android 的语音增强/降噪/降噪库-6ren

android - 适用于 android 的语音增强/降噪/噪声抑制库

转载作者：行者123 更新时间：2023-11-29 01:06:24

我正在开发一个具有语音识别功能的应用程序，使用的是 android 内置的 SpeechRecognizer 和 RecognizerIntent。是否有适用于 android 的降噪或噪声抑制库，可以集成到我的应用程序中以提高语音识别的准确性？我在 android 中看到了一个 NoiseSuppressor 类，但我不知道如何将它与 SpeechRecognizer 集成。我是 android 编程的新手。提前致谢。

public class MainActivity extends AppCompatActivity implements RecognitionListener {

// Recorder created in onCreate solely to obtain an audio session id for the
// NoiseSuppressor availability check; it is never passed to the recognizer.
private AudioRecord audioRecord;
// Shows partial results, final results and error messages.
private TextView returnedText;
// Opens EditorActivity with the currently displayed text.
private Button editButton;
// Clears returnedText.
private Button clearButton;
// Starts (checked) / stops (unchecked) listening.
private ToggleButton toggleButton;
// Indeterminate spinner while waiting; shows the RMS level once speech begins.
private ProgressBar progressBar;
// Current recognizer; re-created by initSpeech() on every toggle change.
private SpeechRecognizer speech ;
// recognizerIntent is rebuilt by initSpeech(); editIntent is built on each edit click.
private Intent recognizerIntent, editIntent;
// Tag used for all Log calls in this activity.
private String LOG_TAG = "MainActivity";

/**
 * Inflates the layout, reports whether a {@link NoiseSuppressor} can be created on this
 * device, and wires up the toggle, clear and edit buttons.
 *
 * @param savedInstanceState state passed through to {@code super.onCreate}; not read here
 */
@Override
protected void onCreate(Bundle savedInstanceState) {
    super.onCreate(savedInstanceState);
    setContentView(R.layout.activity_main);

    // Capability check only: the probed audio session is not used by the recognizer.
    if (probeNoiseSuppressor()) {
        Toast.makeText(this, "Have Suppersor", Toast.LENGTH_LONG).show();
    } else {
        Toast.makeText(this, "No Suppersor", Toast.LENGTH_LONG).show();
    }

    returnedText = (TextView) findViewById(R.id.textView1);
    progressBar = (ProgressBar) findViewById(R.id.progressBar1);
    toggleButton = (ToggleButton) findViewById(R.id.toggleButton1);
    editButton = (Button) findViewById(R.id.button1);
    clearButton = (Button) findViewById(R.id.button2);

    progressBar.setVisibility(View.INVISIBLE);

    toggleButton.setOnCheckedChangeListener(new CompoundButton.OnCheckedChangeListener() {

        @Override
        public void onCheckedChanged(CompoundButton buttonView, boolean isChecked) {
            // NOTE(review): initSpeech() runs for both transitions, so a fresh recognizer
            // is also created when the toggle is switched off. The recognition callbacks
            // in this class call speech.destroy() right after unchecking the toggle, so
            // changing this needs a coordinated change there.
            initSpeech();
            if (isChecked) {
                progressBar.setVisibility(View.VISIBLE);
                progressBar.setIndeterminate(true);
                speech.startListening(recognizerIntent);
            } else {
                progressBar.setIndeterminate(false);
                progressBar.setVisibility(View.INVISIBLE);
                speech.stopListening();
            }
        }
    });

    clearButton.setOnClickListener(new View.OnClickListener() {
        @Override
        public void onClick(View v) {
            returnedText.setText("");
        }
    });

    editButton.setOnClickListener(new View.OnClickListener() {
        @Override
        public void onClick(View v) {
            // Hand the current transcript to the editor screen.
            editIntent = new Intent(MainActivity.this, EditorActivity.class);
            String forEditText = returnedText.getText().toString();
            editIntent.putExtra("forEdit", forEditText);
            startActivity(editIntent);
        }
    });
}

/**
 * Checks whether a {@link NoiseSuppressor} can be created for a microphone session.
 *
 * <p>A temporary {@link AudioRecord} is opened only to obtain a session id. Both it and
 * the effect are released before returning, so no native audio resources stay allocated.
 *
 * @return {@code true} if {@link NoiseSuppressor#create(int)} returned an effect
 */
private boolean probeNoiseSuppressor() {
    // Use one sample rate for both the buffer-size query and the recorder itself.
    final int sampleRate = 8000;
    final int minBufferSize = AudioRecord.getMinBufferSize(
            sampleRate, AudioFormat.CHANNEL_IN_MONO, AudioFormat.ENCODING_PCM_16BIT);
    if (minBufferSize <= 0) {
        // getMinBufferSize reports failures as negative error codes.
        Log.w(LOG_TAG, "getMinBufferSize failed: " + minBufferSize);
        return false;
    }

    NoiseSuppressor noiseSuppressor = null;
    try {
        audioRecord = new AudioRecord(MediaRecorder.AudioSource.MIC, sampleRate,
                AudioFormat.CHANNEL_IN_MONO, AudioFormat.ENCODING_PCM_16BIT,
                minBufferSize * 10);
        noiseSuppressor = NoiseSuppressor.create(audioRecord.getAudioSessionId());
        return noiseSuppressor != null;
    } catch (IllegalArgumentException e) {
        Log.w(LOG_TAG, "Could not create AudioRecord for noise suppressor probe", e);
        return false;
    } finally {
        if (noiseSuppressor != null) {
            noiseSuppressor.release();
        }
        if (audioRecord != null) {
            audioRecord.release();
            audioRecord = null;
        }
    }
}

/**
 * Creates a new {@link SpeechRecognizer} that reports to this activity and rebuilds the
 * intent used to start recognition. Both are stored in fields.
 *
 * NOTE(review): the previously stored recognizer is not destroyed here — confirm whether
 * that is intended. Also presumably {@code EXTRA_LANGUAGE} was meant rather than
 * {@code EXTRA_LANGUAGE_PREFERENCE}; verify against the RecognizerIntent documentation.
 */
private void initSpeech(){
    speech = SpeechRecognizer.createSpeechRecognizer(this);
    speech.setRecognitionListener(this);

    final Intent intent = new Intent(RecognizerIntent.ACTION_RECOGNIZE_SPEECH);

    // Language and model selection.
    intent.putExtra(RecognizerIntent.EXTRA_LANGUAGE_MODEL, RecognizerIntent.LANGUAGE_MODEL_FREE_FORM);
    intent.putExtra(RecognizerIntent.EXTRA_LANGUAGE_PREFERENCE,"en");
    intent.putExtra(RecognizerIntent.EXTRA_CALLING_PACKAGE, getPackageName());

    // Recognition behaviour.
    intent.putExtra(RecognizerIntent.EXTRA_PREFER_OFFLINE, true);
    intent.putExtra(RecognizerIntent.EXTRA_PARTIAL_RESULTS, true);
    intent.putExtra("android.speech.extra.DICTATION_MODE", true);
    intent.putExtra(RecognizerIntent.EXTRA_SPEECH_INPUT_POSSIBLY_COMPLETE_SILENCE_LENGTH_MILLIS, 5000);

    recognizerIntent = intent;
}

/** Adds nothing of its own; simply delegates to the superclass implementation. */
@Override
public void onResume() {
    super.onResume();
}

/**
 * Tears down the current recognizer when the activity leaves the foreground.
 *
 * <p>{@code destroy()} cancels any recognition in progress and releases the recognizer,
 * so it is not left bound after the activity goes away. A new recognizer is created by
 * {@code initSpeech()} the next time the toggle changes.
 */
@Override
protected void onPause() {
    super.onPause();
    if (speech != null) {
        speech.destroy();
        Log.i(LOG_TAG, "destroy");
    }
}

/**
 * Recognition callback for the start of speech: switches the progress bar from the
 * indeterminate spinner to a determinate 0..10 scale (fed by {@code onRmsChanged}).
 */
@Override
public void onBeginningOfSpeech() {
    final String event = "onBeginningOfSpeech";
    Log.i(LOG_TAG, event);

    progressBar.setIndeterminate(false);
    progressBar.setMax(10);
}

/**
 * Recognition callback carrying a chunk of recorded audio; only logged here.
 *
 * @param buffer audio bytes delivered by the recognizer; may be {@code null}
 */
@Override
public void onBufferReceived(byte[] buffer) {
    // Concatenating the array itself would only print its identity hash, so log its size.
    final int length = (buffer == null) ? 0 : buffer.length;
    Log.i(LOG_TAG, "onBufferReceived: " + length + " bytes");
}

/**
 * Recognition callback for the end of speech: shows the indeterminate spinner, unchecks
 * the toggle and destroys whatever recognizer {@code speech} refers to afterwards.
 */
@Override
public void onEndOfSpeech() {
    progressBar.setIndeterminate(true);
    Log.i(LOG_TAG, "onEndOfSpeech");

    // Unchecking fires the toggle's change listener, so this must stay before destroy().
    toggleButton.setChecked(false);
    speech.destroy();
}

/**
 * Recognition callback for failures: shows and logs a readable message for the error
 * code, unchecks the toggle and destroys the recognizer.
 *
 * @param errorCode one of the {@code SpeechRecognizer.ERROR_*} codes
 */
@Override
public void onError(int errorCode) {
    final String description = getErrorText(errorCode);
    returnedText.setText(description);
    Log.d(LOG_TAG, "FAILED " + description);

    // Unchecking fires the toggle's change listener, so this must stay before destroy().
    toggleButton.setChecked(false);
    speech.destroy();
}

/**
 * Recognition callback for additional events; both arguments are ignored and the call
 * is only logged.
 */
@Override
public void onEvent(int arg0, Bundle arg1) {
    final String event = "onEvent";
    Log.i(LOG_TAG, event);
}

/**
 * Recognition callback for intermediate hypotheses: replaces the displayed text with
 * the current candidates, one per line.
 *
 * @param partialResults bundle expected to hold the candidates under
 *                       {@link SpeechRecognizer#RESULTS_RECOGNITION}
 */
@Override
public void onPartialResults(Bundle partialResults) {
    if (partialResults == null) {
        return;
    }
    ArrayList<String> matches = partialResults
            .getStringArrayList(SpeechRecognizer.RESULTS_RECOGNITION);
    if (matches == null) {
        // The key may be absent; keep the current text instead of crashing.
        return;
    }

    StringBuilder text = new StringBuilder();
    for (String result : matches) {
        text.append(result).append("\n");
    }
    returnedText.setText(text.toString());
}

/**
 * Recognition callback signalling that the recognizer is ready for speech; the bundle
 * is ignored and the call is only logged.
 */
@Override
public void onReadyForSpeech(Bundle arg0) {
    final String event = "onReadyForSpeech";
    Log.i(LOG_TAG, event);
}

/**
 * Recognition callback for final results: appends every candidate (one per line) to the
 * displayed text, then destroys the recognizer.
 *
 * @param results bundle expected to hold the candidates under
 *                {@link SpeechRecognizer#RESULTS_RECOGNITION}
 */
@Override
public void onResults(Bundle results) {
    Log.i(LOG_TAG, "onResults");
    ArrayList<String> matches = (results == null)
            ? null
            : results.getStringArrayList(SpeechRecognizer.RESULTS_RECOGNITION);

    // The key may be absent; skip the UI update but still release the recognizer below.
    if (matches != null) {
        StringBuilder text = new StringBuilder();
        for (String result : matches) {
            text.append(result).append("\n");
        }
        returnedText.append(text.toString());
    }
    speech.destroy();
}

/**
 * Recognition callback for input-level changes: logs the level and mirrors it, truncated
 * to an int, on the progress bar.
 *
 * @param rmsdB the level reported by the recognizer
 */
@Override
public void onRmsChanged(float rmsdB) {
    Log.i(LOG_TAG, "onRmsChanged: " + rmsdB);

    final int level = (int) rmsdB;
    progressBar.setProgress(level);
}

/**
 * Maps a {@code SpeechRecognizer.ERROR_*} code to a short English description.
 *
 * @param errorCode code received in {@code onError}
 * @return the matching description, or a generic "try again" message for any other code
 */
public static String getErrorText(int errorCode) {
    switch (errorCode) {
        case SpeechRecognizer.ERROR_AUDIO:
            return "Audio recording error";
        case SpeechRecognizer.ERROR_CLIENT:
            return "Client side error";
        case SpeechRecognizer.ERROR_INSUFFICIENT_PERMISSIONS:
            return "Insufficient permissions";
        case SpeechRecognizer.ERROR_NETWORK:
            return "Network error";
        case SpeechRecognizer.ERROR_NETWORK_TIMEOUT:
            return "Network timeout";
        case SpeechRecognizer.ERROR_NO_MATCH:
            return "No match";
        case SpeechRecognizer.ERROR_RECOGNIZER_BUSY:
            return "RecognitionService busy";
        case SpeechRecognizer.ERROR_SERVER:
            return "error from server";
        case SpeechRecognizer.ERROR_SPEECH_TIMEOUT:
            return "No speech input";
        default:
            // Any code not listed above.
            return "Didn't understand, please try again.";
    }
}

最佳答案

只需像下面这样，通过您的 AudioManager 设置参数 “noise_suppression=on”：

// Passes the key/value string "noise_suppression=on" to the audio layer via AudioManager.
// NOTE(review): this key is not a documented framework constant — presumably
// vendor/HAL-specific; verify that the target devices actually honor it.
yourAudioManager.setParameters("noise_suppression=on");

关于android - android 的语音增强/降噪/降噪库，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/46762235/

文章推荐： android - 返回在内部 fragment 中不起作用

文章推荐： android - 在 kotlin android tailrec 函数中返回 0

android - Android:Android Studio中的Gradle错误
我最近在/ drawable中添加了一些.gifs，以便可以将它们与按钮一起使用。这个工作正常(没有错误)。现在，当我重建/运行我的应用程序时，出现以下错误: Error: Gradle: Execu
android - (Android) 在内部存储中查找路径/Android
Android 中有返回内部存储数据路径的方法吗？我有 2 部 Android 智能手机(Samsung s2 和 s7 edge)，我在其中安装了一个应用程序。我想使用位于这条路径中的 sqlit
android - @android : and ? android 之间有什么区别:
这个问题在这里已经有了答案: What's the difference between "?android:" and "@android:" in an android layout xml f
android - Android 开发手机、Android 普通手机和 Android root 手机之间的区别
我只想知道 android 开发手机、android 普通手机和 android root 手机之间的实际区别。我们不能从实体店或除 android marketplace 以外的其他地方购买开发手
android - Android-android-apt插件与Android Gradle插件不兼容。
自Gradle更新以来，我正在努力使这个项目达到标准。这是一个团队项目，它使用的是android-apt插件。我已经进行了必要的语法更改(编译->实现和apt->注释处理器)，但是编译器仍在告诉我存在
android - Android Spinner未填充| Android Kotlin
我是android和kotlin的新手，所以请原谅要解决的一个非常简单的问题! 我已经使用导航体系结构组件创建了一个基本应用程序，使用了底部的导航栏和三个导航选项。每个导航选项都指向一个专用片段，该片
android - Facebook android，获取应用程序流 - Android
我目前正在使用 Facebook official SDK for Android . 我现在正在使用高级示例应用程序，但我不知道如何让它获取应用程序墙/流/状态而不是登录的用户。这可能吗？在那种情
android - 无法在 Android 手机中下载文件 - Android..？
我在下载文件时遇到问题，我可以在模拟器中下载文件，但无法在手机上使用。我已经定义了上网和写入 SD 卡的权限。我在服务器上有一个 doc 文件，如果用户单击下载。它下载文件。这在模拟器中工作正常但
android - android :layout_gravity and android:gravity之间的区别
这个问题在这里已经有了答案: What is the difference between gravity and layout_gravity in Android? (22 个答案) 关闭 9
android - Android 缓存内存和 Android 应用程序缓存内存有什么区别
任何人都可以告诉我什么是 android 缓存和应用程序缓存，因为当我们谈论缓存清理应用程序时，它的作用是，缓存清理概念是清理应用程序缓存还是像内存管理一样主存储、RAM、缓存是不同的并且据我所知，缓
android - Android 应用程序能否知道另一个 Android 应用程序何时运行？
假设应用程序 Foo 和 Eggs 在同一台 Android 设备上。任一应用程序都可以获取设备上所有应用程序的列表。一个应用程序是否有可能知道另一个应用程序是否已经运行以及运行了多长时间？最佳答案
android - Webrtc Android 到 Android？
我有点困惑，我只看到了从 android 到 pc 或者从 android 到 pc 的例子。我需要制作一个从两部手机 (android) 连接的 android 应用程序进行视频聊天。我在想，我知道
android - Android 的锁屏无法使用 Android 正常工作
用于使用 Android 以编程方式锁定屏幕。我从 Stackoverflow 之前关于此的问题中得到了一些好主意，并且我做得很好，但是当我运行该代码时，没有异常和错误。而且，屏幕没有锁定。请在这段代
android - android :layout_alignParentTop and android:layout_alignParentStart之间的区别
文档说: android:layout_alignParentStart If true, makes the start edge of this view match the start edge
android - android :layout_width and android:width有什么区别
我不知道这两个属性和高度之间的区别。以一个TextView为例，如果我将它的layout_width设置为wrap_content，并将它的width设置为50 dip，会发生什么情况？最佳答案
android - android :noHistory and android:finishOnTaskLaunch之间的关系
这两个属性有什么关系？如果我有 android:noHistory="true"，那么有 android:finishOnTaskLaunch="true" 有什么意义吗？最佳答案假设您的应用中有
android - 什么时候使用 "?android"或 "@android"？
我是新手，正在尝试理解以下 XML 代码: 查看 developer.android.com 上的文档，它说“starStyle”是 R.attr 中的常量， public static final
android - android :width and android:layout_width之间的区别
在下面的代码中，为什么当我设置时单选按钮的外观会发生变化 android:layout_width="fill_parent" 和 android:width="fill_parent" 我说的是
android - Android 移动应用程序可以在 Android 平板电脑上运行吗？
很难说出这里要问什么。这个问题模棱两可、含糊不清、不完整、过于宽泛或夸夸其谈，无法以目前的形式得到合理的回答。如需帮助澄清此问题以便重新打开，visit the help center . 关闭 9
android - 如何在 android 中保存函数调用并在以后再次使用它 Android
假设我有一个函数 fun myFunction(name:String, email:String){}，当我调用这个函数时 myFunction('Ali', 'ali@test.com ') 如何

行者123

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

android - android 的语音增强/降噪/降噪库