Android.Media.MediaRecorder - 录制音频时有延迟,有部分静音

Android.Media.MediaRecorder - delay when recording audio, with sections of silence

请帮忙解决问题。要录制音频文件,我使用 Android.Media.MediaRecorder。结果,我得到了一个在文件开头和结尾有 650 毫秒静音的部分。结果发现开头和结尾的那部分乐句没有录下来,只有沉默。

public static async Task Record(CancellationToken token)
    {
        try
        {
            var filename = System.Environment.GetFolderPath(System.Environment.SpecialFolder.Personal) + "/temp.amr";
            var tmp = new Java.IO.File(filename);
            if (tmp.Exists()) tmp.Delete();
            var recorder = new MediaRecorder();
            recorder.SetAudioSource(AudioSource.Mic);
            recorder.SetOutputFormat(OutputFormat.AmrNb);
            recorder.SetAudioEncoder(AudioEncoder.AmrNb);
            recorder.SetOutputFile(filename);
            recorder.Prepare();
            recorder.Start();
            try
            {
                var div = MAX_RECORD_TIME / 100;
                for(int i=0; i<div; i++)
                {
                    IncrementProgressBar(100 / div);
                    await Task.Delay(div, token);
                }
                fSave = true;
            }
            catch (OperationCanceledException) { }
            recorder.Stop();
        }
        catch (Exception e)
        {
            string s = context.GetText(Resource.String.err_unexpected) + "\r" + e.Message;
            handler.ToastMessage(s, ToastLength.Short);
        }
    }

此问题无法通过代码解决,看来是硬件问题。 您可以在默认相机应用程序中看到相同的延迟,该应用程序也使用 MediaRecorder。 不幸的是,某些设备的行为会有所不同。

解决方案是使用 AudioRecorder class,它更灵活,因为它更接近硬件

为自己找到了解决方案。以下代码正在运行,可能对某人有用。

    public static async Task Record(CancellationToken token)
    {
        var filename = Environment.GetFolderPath(System.Environment.SpecialFolder.Personal) + "/wav.pcm";
        System.IO.Stream outputStream = System.IO.File.Open(filename, FileMode.Create);
        BinaryWriter bWriter = new BinaryWriter(outputStream);
        var audioBuffer = new byte[8000];
        var audRecorder = new AudioRecord(AudioSource.Mic, 8000, ChannelIn.Mono, Encoding.Pcm16bit, audioBuffer.Length);
        while(audRecorder.State != State.Initialized) { }
        audRecorder.StartRecording();
        while (!token.IsCancellationRequested)
        {
            try
            {
                var audioData = await audRecorder.ReadAsync(audioBuffer, 0, audioBuffer.Length);
                bWriter.Write(audioBuffer);
                IncrementProgressBar(1);
            }
            catch (Exception ex)
            {
                System.Console.Out.WriteLine("INFO: " + ex.Message);
                break;
            }
        }
        outputStream.Close();
        bWriter.Close();
        audRecorder.Stop();
        audRecorder.Release();
        fSave = true;
    }
    public static async Task Play(CancellationToken token)
    {
        var filename = Environment.GetFolderPath(Environment.SpecialFolder.Personal) + "/wav.pcm";
        var audBuffer = await System.IO.File.ReadAllBytesAsync(filename, token);
        var bufferSizeInBytes = audBuffer.Length / 2;
        AudioTrack audioTrack;
        if (Android.OS.Build.VERSION.SdkInt >= Android.OS.BuildVersionCodes.Lollipop)
        {
            AudioAttributes attributes = new AudioAttributes.Builder().SetLegacyStreamType(Android.Media.Stream.Music)
                                                                    .Build();
            AudioFormat format = new AudioFormat.Builder().SetChannelMask(ChannelOut.Mono)
                                                            .SetEncoding(Encoding.Pcm16bit)
                                                            .SetSampleRate(8000)
                                                            .Build();
            audioTrack = new AudioTrack(attributes, format, bufferSizeInBytes, AudioTrackMode.Stream, 1);
        }
        else
        {
            audioTrack = new AudioTrack(Android.Media.Stream.Music, 8000, ChannelOut.Mono,
                                        Encoding.Pcm16bit, bufferSizeInBytes, AudioTrackMode.Stream);
        }
        audioTrack.Play();
        await audioTrack.WriteAsync(audBuffer, 0, bufferSizeInBytes*2);
        try
        {
            await Task.Delay(((bufferSizeInBytes/8000)-1)*1000, token);
        }
        catch (OperationCanceledException) { }
        audioTrack.Stop();
        audioTrack.Release();
    }      
    public static async Task SaveAsAmr()
    {
        var encoder = MediaCodec.CreateEncoderByType(MediaFormat.MimetypeAudioAmrNb);
        MediaFormat format = new MediaFormat();
        format.SetString(MediaFormat.KeyMime, MediaFormat.MimetypeAudioAmrNb);
        format.SetInteger(MediaFormat.KeySampleRate, 8000);
        format.SetInteger(MediaFormat.KeyChannelCount, 1);
        format.SetInteger(MediaFormat.KeyBitRate, 7936);
        encoder.Configure(format, null, null, MediaCodecConfigFlags.Encode);

        try
        {
            Java.IO.File pcmFile = new Java.IO.File(Environment.GetFolderPath(Environment.SpecialFolder.Personal) + "/wav.pcm");
            FileInputStream fis = new FileInputStream(pcmFile);
            Java.IO.File armFIle = new Java.IO.File(Environment.GetFolderPath(Environment.SpecialFolder.Personal) + "/wav.amr");
            FileOutputStream fos = new FileOutputStream(armFIle);
            fos.Write(System.Text.Encoding.ASCII.GetBytes("#!AMR\n"));
            encoder.Start();

            var tempBuffer = new byte[8000];
            var hasMoreData = true;
            MediaCodec.BufferInfo outBuffInfo = new MediaCodec.BufferInfo();
            double presentationTimeUs = 0;
            int totalBytesRead = 0;

            do
            {
                int inputBufIndex = 0;
                while (inputBufIndex != -1 && hasMoreData)
                {
                    inputBufIndex = encoder.DequeueInputBuffer(0);
                    if (inputBufIndex >= 0)
                    {
                        Java.Nio.ByteBuffer dstBuf;
                        if (Android.OS.Build.VERSION.SdkInt >= Android.OS.BuildVersionCodes.Lollipop)
                        {
                            dstBuf = encoder.GetInputBuffer(inputBufIndex);
                        }
                        else
                        {
                            dstBuf = encoder.GetInputBuffers()[inputBufIndex];
                        }
                        dstBuf.Clear();

                        int bytesRead = await fis.ReadAsync(tempBuffer, 0, dstBuf.Limit());
                        if (bytesRead == -1)
                        { // -1 implies EOS
                            hasMoreData = false;
                            encoder.QueueInputBuffer(inputBufIndex, 0, 0, (long)presentationTimeUs, MediaCodecBufferFlags.EndOfStream);
                        }
                        else
                        {
                            totalBytesRead += bytesRead;
                            dstBuf.Put(tempBuffer, 0, bytesRead);
                            encoder.QueueInputBuffer(inputBufIndex, 0, bytesRead, (long)presentationTimeUs, 0);
                            presentationTimeUs = 1000000L * (totalBytesRead / 2) / 8000;
                        }
                    }
                }
                // Drain audio
                int outputBufIndex = 0;
                while (outputBufIndex != (int)MediaCodecInfoState.TryAgainLater)
                {
                    outputBufIndex = encoder.DequeueOutputBuffer(outBuffInfo, 0);
                    if (outputBufIndex >= 0)
                    {
                        Java.Nio.ByteBuffer encodedData;
                        if (Android.OS.Build.VERSION.SdkInt >= Android.OS.BuildVersionCodes.Lollipop)
                        {
                            encodedData = encoder.GetOutputBuffer(outputBufIndex);
                        }
                        else
                        {
                            encodedData = encoder.GetOutputBuffers()[outputBufIndex];
                        }
                        encodedData.Position(outBuffInfo.Offset);
                        encodedData.Limit(outBuffInfo.Offset + outBuffInfo.Size);
                        byte[] outData = new byte[outBuffInfo.Size];
                        encodedData.Get(outData, 0, outBuffInfo.Size);
                        fos.Write(outData, 0, outBuffInfo.Size);
                        encoder.ReleaseOutputBuffer(outputBufIndex, false);
                    }
                }
            } while (outBuffInfo.Flags != MediaCodecBufferFlags.EndOfStream);
            fis?.Close();
            fos?.Flush();
            fos?.Close();
        }
        catch(Exception ex)
        {
            System.Console.Out.WriteLine("INFO: " + ex.Message);
        }
    }