Problem while encoding PCM Stereo file to M4A stereo

I am facing an issue while encoding a stereo M4A file from PCM. My code works perfectly for mono encoding (channel count = 1), but it does not work for stereo (channel count = 2). The problem is that the encoded audio ends up with double the duration of the original.

I have logged the sample rate and the channel count, and both are correct: a 48.100 kHz sample rate and a channel count of 2.

Below is my encoding method code:

/**
 * Encodes the PCM chunks queued in {@code data} with a MediaCodec encoder created for
 * {@code COMPRESSED_AUDIO_FILE_MIME_TYPE} and writes the encoded output through a MediaMuxer
 * to {@code outFileName + ".m4a"} under {@code outFilePath}.
 *
 * NOTE(review): this listing appears to have lost several closing braces (and possibly some
 * statements), so the exact scope of a few blocks below cannot be determined from here.
 * NOTE(review): no codec.start(), mux.start(), mux.stop() or release() call is visible in this
 * listing - confirm they exist in the full source.
 *
 * @return false when a FileNotFoundException or IOException is caught; the listing ends with
 *         {@code return true}
 */
public boolean mediaMux(){
        try {

            // Resolve the output location and remove any previous file with the same name.
            File outputDirectory = new File(outFilePath);
            // NOTE(review): the body of this 'if' is not visible in the listing - presumably it
            // creates the directory; confirm.
            if (!outputDirectory.exists()){
            File outputFile = new File(outputDirectory.getPath() , outFileName + ".m4a");
            if (outputFile.exists()) outputFile.delete();

            MediaMuxer mux = null;
            mux = new MediaMuxer(outputFile.getAbsolutePath(), MediaMuxer.OutputFormat.MUXER_OUTPUT_MPEG_4);

            // Describe the encoder output: AAC-LC at the configured sample rate, channel count and bitrate.
            MediaFormat outputFormat = MediaFormat.createAudioFormat(COMPRESSED_AUDIO_FILE_MIME_TYPE,
                    sampleRate, channel);
            outputFormat.setInteger(MediaFormat.KEY_AAC_PROFILE, MediaCodecInfo.CodecProfileLevel.AACObjectLC);
            outputFormat.setInteger(MediaFormat.KEY_BIT_RATE, bitrate);

            MediaCodec codec = MediaCodec.createEncoderByType(COMPRESSED_AUDIO_FILE_MIME_TYPE);
            codec.configure(outputFormat, null, null, MediaCodec.CONFIGURE_FLAG_ENCODE);

            ByteBuffer[] codecInputBuffers = codec.getInputBuffers(); // Note: Array of buffers
            ByteBuffer[] codecOutputBuffers = codec.getOutputBuffers();

            MediaCodec.BufferInfo outBuffInfo = new MediaCodec.BufferInfo();

            // NOTE(review): tempBuffer is not used anywhere in the visible listing.
            byte[] tempBuffer = new byte[bufferSize];

            // Timestamp (microseconds) passed with each queued input buffer.
            double presentationTimeUs = 0;
            int audioTrackIdx = 0;
            // Running count of PCM bytes handed to the encoder; drives presentationTimeUs.
            int totalBytesRead = 0;
            int percentComplete;

            // Each pass feeds as much queued PCM as the codec accepts, then drains encoded output.
            do {

                // Feed phase: runs while the codec hands out input buffers and 'data' has chunks.
                int inputBufIndex = 0;
                while (inputBufIndex != -1 && data.size() > 0) {
                    try {
                        Log.w("Read Log","Reading Data");
                        inputBufIndex = codec.dequeueInputBuffer(CODEC_TIMEOUT_IN_MS);

                        if (inputBufIndex >= 0) {
                            ByteBuffer dstBuf = codecInputBuffers[inputBufIndex];

                            // Take the next PCM chunk from the queue.
                            byte[] a = data.remove();

                            int bytesRead = a.length;
                            //Log.w("DestBuffer Limit",dstBuf.limit() +"");
                            // When hasMoreData is false, an empty buffer flagged END_OF_STREAM is queued
                            // and the chunk just removed from 'data' is not copied into the codec.
                            if (!hasMoreData) { // -1 implies EOS

                                codec.queueInputBuffer(inputBufIndex, 0, 0, (long) presentationTimeUs, MediaCodec.BUFFER_FLAG_END_OF_STREAM);
                            } else {
                                totalBytesRead += bytesRead;
                                dstBuf.put(a, 0, bytesRead);
                                codec.queueInputBuffer(inputBufIndex, 0, bytesRead, (long) presentationTimeUs, 0);
                                // Timestamp for the NEXT buffer: bytes consumed so far -> microseconds.
                                // NOTE(review): the divisor is 2 (bytes per 16-bit sample) and does not
                                // include 'channel'; if the input is interleaved multi-channel PCM this
                                // advances the clock once per channel sample rather than once per frame - confirm.
                                presentationTimeUs = 1000000l * (totalBytesRead / 2) / sampleRate;
                    // NOTE(review): the handler body for this catch is not visible in the listing.
                    }catch (NoSuchElementException ex){

                // Drain audio
                // Drain phase: keeps dequeuing output until the codec reports INFO_TRY_AGAIN_LATER.
                int outputBufIndex = 0;
                while (outputBufIndex != MediaCodec.INFO_TRY_AGAIN_LATER) {
                    Log.w("Write Log","Writing Data");
                    outputBufIndex = codec.dequeueOutputBuffer(outBuffInfo, CODEC_TIMEOUT_IN_MS);
                    if (outputBufIndex >= 0) {
                        ByteBuffer encodedData = codecOutputBuffers[outputBufIndex];
                        // Restrict the buffer to the range described by outBuffInfo.
                        encodedData.limit(outBuffInfo.offset + outBuffInfo.size);

                        // Non-empty codec-config buffers are released without being written to the muxer;
                        // every other buffer is written to the audio track and then released.
                        if ((outBuffInfo.flags & MediaCodec.BUFFER_FLAG_CODEC_CONFIG) != 0 && outBuffInfo.size != 0) {
                            codec.releaseOutputBuffer(outputBufIndex, false);
                        } else {
                            mux.writeSampleData(audioTrackIdx, codecOutputBuffers[outputBufIndex], outBuffInfo);
                            codec.releaseOutputBuffer(outputBufIndex, false);
                    } else if (outputBufIndex == MediaCodec.INFO_OUTPUT_FORMAT_CHANGED) {
                        // The codec reported its actual output format: register it as the muxer track.
                        outputFormat = codec.getOutputFormat();
                        Log.v(LOGTAG, "Output format changed - " + outputFormat);
                        audioTrackIdx = mux.addTrack(outputFormat);
                    } else if (outputBufIndex == MediaCodec.INFO_OUTPUT_BUFFERS_CHANGED) {
                        // Only logged; codecOutputBuffers is not refreshed here.
                        Log.e(LOGTAG, "Output buffers changed during encode!");
                    } else if (outputBufIndex == MediaCodec.INFO_TRY_AGAIN_LATER) {
                        // NO OP
                    } else {
                        Log.e(LOGTAG, "Unknown return code from dequeueOutputBuffer - " + outputBufIndex);
                //percentComplete = (int) Math.round(((float) totalBytesRead / (float) inputFile.length()) * 100.0);
                // The percentage computation above is commented out, so this logs the label only.
                Log.v(LOGTAG, "Conversion % - " );
            // Stops once the last dequeued buffer's flags equal END_OF_STREAM exactly, or mStop is set.
            } while (outBuffInfo.flags != MediaCodec.BUFFER_FLAG_END_OF_STREAM && !mStop);

            Log.v(LOGTAG, "Compression done ...");
        } catch (FileNotFoundException e) {
            Log.e(LOGTAG, "File not found!", e);
            return false;
        } catch (IOException e) {
            Log.e(LOGTAG, "IO exception!", e);
            return false;
        // NOTE(review): the body of this catch and the closing braces are not visible in the listing.
        } catch (Exception e){

        return true;

Update: recording audio code chunk

// Create the recorder. The AudioRecord constructor takes, in order:
// audioSource, sampleRateInHz, channelConfig, audioFormat, bufferSizeInBytes.
// recordingChannels is the channel mask (AudioFormat.CHANNEL_IN_MONO or
// AudioFormat.CHANNEL_IN_STEREO); without it the call has only four arguments
// and matches no AudioRecord constructor.
recorder = new AudioRecord(
                MediaRecorder.AudioSource.MIC, recordingSampleRate,
                recordingChannels,
                AudioFormat.ENCODING_PCM_16BIT, minBufferSize * 2);

If the user selects mono, recordingChannels = AudioFormat.CHANNEL_IN_MONO; for stereo, recordingChannels = AudioFormat.CHANNEL_IN_STEREO. Thanks in advance.


  • I think

    presentationTimeUs = 1000000l * (totalBytesRead / 2) / sampleRate;

    should actually be

    presentationTimeUs = 1000000l * (totalBytesRead / (2 * channel)) / sampleRate;

    as you have 2 bytes per sample per channel, i.e. 4 bytes per sample for stereo.