使用语音识别打开应用程序(PocketSphinx)

时间:2018-01-21 19:50:51

标签: android speech-recognition voice-recognition pocketsphinx pocketsphinx-android

我想在Android中创建一个语音识别应用程序,并让它在服务(Service)中运行,这样即使不在该应用程序的界面中,我也可以使用它。为此我查找了一些参考资料,并在GitHub上找到了一个演示应用程序。

这是网站https://github.com/ihrupin/SpeechRecognitionService

我下载了这个应用程序,也阅读了文档。它运行良好,并且确实是在服务中运行的。但我真正想要的是:例如,当我说"打开Facebook"(open Facebook)时,它能打开已安装的Facebook应用程序。

我是使用PocketSphinx的新手。

这是MainActivity

/**
 * Activity whose button ({@code R.id.btn}) starts {@link VoiceService}.
 *
 * <p>The service is only started when RECORD_AUDIO is not denied; otherwise
 * the permission is requested first and the service is started from the
 * permission callback.
 */
public class MainActivity extends AppCompatActivity {

    private static final int PERMISSIONS_REQUEST_RECORD_AUDIO = 1;
    private static final String LOG_TAG = MainActivity.class.getSimpleName();

    /**
     * Inflates the layout and wires the button's click handler.
     *
     * @param savedInstanceState forwarded unchanged to the superclass
     */
    @Override
    protected void onCreate(Bundle savedInstanceState) {
        super.onCreate(savedInstanceState);
        setContentView(R.layout.activity_main);

        Button startButton = (Button) findViewById(R.id.btn);
        startButton.setOnClickListener(new View.OnClickListener() {
            @Override
            public void onClick(View v) {
                Log.i(LOG_TAG, "onClick");
                boolean micDenied = ContextCompat.checkSelfPermission(
                        getApplicationContext(), Manifest.permission.RECORD_AUDIO)
                        == PackageManager.PERMISSION_DENIED;
                if (micDenied) {
                    // Ask first; the service is started from onRequestPermissionsResult.
                    ActivityCompat.requestPermissions(
                            MainActivity.this,
                            new String[]{Manifest.permission.RECORD_AUDIO},
                            PERMISSIONS_REQUEST_RECORD_AUDIO);
                } else {
                    launchVoiceService();
                }
            }
        });
    }

    /**
     * Handles the answer to the RECORD_AUDIO request issued by the click
     * handler: starts the service when granted, closes the activity otherwise.
     * Results for any other request code are ignored.
     *
     * @param requestCode  code passed to {@code requestPermissions}
     * @param permissions  the permissions that were requested
     * @param grantResults per-permission grant results
     */
    @Override
    public void onRequestPermissionsResult(int requestCode,
                                           String[] permissions, int[] grantResults) {
        super.onRequestPermissionsResult(requestCode, permissions, grantResults);

        if (requestCode != PERMISSIONS_REQUEST_RECORD_AUDIO) {
            return;
        }

        boolean micGranted = grantResults.length > 0
                && grantResults[0] == PackageManager.PERMISSION_GRANTED;
        if (micGranted) {
            launchVoiceService();
        } else {
            finish();
        }
    }

    /** Issues the start request for {@link VoiceService}. */
    private void launchVoiceService() {
        startService(new Intent(this, VoiceService.class));
    }
}

这是我的服务

/**
 * Started service that sets up a PocketSphinx {@code SpeechRecognizer} with a
 * single keyphrase search and logs the recognizer callbacks.
 *
 * <p>Recognizer setup is performed at most once per service instance, no
 * matter how many start requests arrive; a failed setup may be retried by a
 * later start request.
 */
public class VoiceService extends Service implements
        RecognitionListener {

    private static final String LOG_TAG = VoiceService.class.getSimpleName();

    /** Name under which the keyphrase search is registered with the recognizer. */
    private static final String KWS_SEARCH = "wakeup";

    /** Phrase the keyphrase search is configured with. */
    private static final String KEYPHRASE = "lisa";

    /** Assigned by {@link #setupRecognizer(File)}; null until setup succeeds. */
    private SpeechRecognizer recognizer;

    /**
     * True once recognizer setup has been kicked off. Read and written only
     * from {@link #onStartCommand} and the setup task's {@code onPostExecute}.
     */
    private boolean setupStarted;

    /** This service does not support binding. */
    @Nullable
    @Override
    public IBinder onBind(Intent intent) {
        return null;
    }

    /**
     * Kicks off recognizer setup if RECORD_AUDIO is granted and setup has not
     * already been started.
     *
     * <p>Without the {@code setupStarted} guard every start request would
     * build another recognizer and overwrite the field, leaving the previous
     * one running and never shut down.
     *
     * @return whatever the superclass implementation returns
     */
    @Override
    public int onStartCommand(Intent intent, int flags, int startId) {
        int permissionCheck = ContextCompat.checkSelfPermission(
                getApplicationContext(), Manifest.permission.RECORD_AUDIO);
        if (permissionCheck == PackageManager.PERMISSION_GRANTED && !setupStarted) {
            setupStarted = true;
            runRecognizerSetup();
        }
        return super.onStartCommand(intent, flags, startId);
    }

    /**
     * Syncs the model assets and builds the recognizer on a background
     * thread, then starts the keyphrase search once setup has succeeded.
     */
    private void runRecognizerSetup() {
        new AsyncTask<Void, Void, Exception>() {
            @Override
            protected Exception doInBackground(Void... params) {
                try {
                    Assets assets = new Assets(VoiceService.this);
                    File assetDir = assets.syncAssets();
                    setupRecognizer(assetDir);
                } catch (IOException e) {
                    // Handed to onPostExecute so the failure is reported there.
                    return e;
                }
                return null;
            }

            @Override
            protected void onPostExecute(Exception result) {
                if (result != null) {
                    // Let a later start request try again, and keep the cause in the log.
                    setupStarted = false;
                    Log.e(LOG_TAG, "Failed to init recognizer ", result);
                } else {
                    switchSearch(KWS_SEARCH);
                }
            }
        }.execute();
    }

    /** Cancels and shuts down the recognizer, if one was created. */
    @Override
    public void onDestroy() {
        super.onDestroy();

        if (recognizer != null) {
            recognizer.cancel();
            recognizer.shutdown();
        }
    }

    /**
     * Logs the partial hypothesis; when it contains the keyphrase, shows a
     * toast and restarts the keyphrase search.
     *
     * @param hypothesis current partial hypothesis, may be null
     */
    @Override
    public void onPartialResult(Hypothesis hypothesis) {
        if (hypothesis == null) {
            return;
        }

        String text = hypothesis.getHypstr();
        if (text.contains(KEYPHRASE)) {
            Toast.makeText(this, "onPartialResult text=" + text, Toast.LENGTH_SHORT).show();
            switchSearch(KWS_SEARCH);
        }

        Log.i(LOG_TAG, "onPartialResult text=" + text);
    }

    /**
     * Logs the final hypothesis text, if any.
     *
     * @param hypothesis final hypothesis, may be null
     */
    @Override
    public void onResult(Hypothesis hypothesis) {
        if (hypothesis != null) {
            String text = hypothesis.getHypstr();
            Log.i(LOG_TAG, "onResult text=" + text);
        }
    }

    @Override
    public void onBeginningOfSpeech() {
        Log.i(LOG_TAG, "onBeginningOfSpeech");
    }

    /** Returns to the keyphrase search if a different search was active. */
    @Override
    public void onEndOfSpeech() {
        if (!recognizer.getSearchName().contains(KWS_SEARCH)) {
            switchSearch(KWS_SEARCH);
        }
        Log.i(LOG_TAG, "onEndOfSpeech");
    }

    /**
     * Stops the current search and starts listening with the named search,
     * passing 10000 as the timeout argument.
     *
     * @param searchName name of a search previously registered on the recognizer
     */
    private void switchSearch(String searchName) {
        Log.i(LOG_TAG, "switchSearch searchName = " + searchName);
        recognizer.stop();
        recognizer.startListening(searchName, 10000);
    }

    /**
     * Builds the recognizer from the synced assets, registers this service as
     * its listener and adds the keyphrase search.
     *
     * @param assetsDir directory returned by {@code Assets.syncAssets()}
     * @throws IOException propagated from the recognizer setup
     */
    private void setupRecognizer(File assetsDir) throws IOException {
        recognizer = SpeechRecognizerSetup.defaultSetup()
                .setAcousticModel(new File(assetsDir, "en-us-ptm"))
                .setDictionary(new File(assetsDir, "cmudict-en-us.dict"))
                .setRawLogDir(assetsDir)
                .setKeywordThreshold(1e-45f)
                .setBoolean("-allphone_ci", true)
                .getRecognizer();
        recognizer.addListener(this);

        recognizer.addKeyphraseSearch(KWS_SEARCH, KEYPHRASE);
    }

    @Override
    public void onError(Exception error) {
        Log.i(LOG_TAG, "onError " + error.getMessage());
    }

    /** Restarts the keyphrase search when listening times out. */
    @Override
    public void onTimeout() {
        switchSearch(KWS_SEARCH);
        Log.i(LOG_TAG, "onTimeout");
    }
}

这是BootReceiver

public class BootReceiver extends BroadcastReceiver {
private static final String LOG_TAG = BootReceiver.class.getSimpleName();

@Override
public void onReceive(Context context, Intent intent) {
    Log.i(LOG_TAG, "onReceive");
    if(intent.getAction().equals(Intent.ACTION_BOOT_COMPLETED)){
        Log.i(LOG_TAG, "onReceive onBoot");
        context.startService(new Intent(context, VoiceService.class));
    }
}
}

我研究了这个主题,我发现我必须修改语法和字典,但我不知道该怎么做。有什么想法吗?

1 个答案:

答案 0 :(得分:0)

如果你想在现有语法的基础上添加自己的词语,只需要做一点小改动:在识别器的设置方法(setupRecognizer)中加入下面这一行。

  

recognizer.addKeyphraseSearch("facebookPhrase", "Open Facebook");

要进一步修改此示例(例如自定义语法和字典),可以阅读官方网站上的教程:

https://cmusphinx.github.io/wiki/tutoriallm/