使用 Java 合并 2 个 AAC 文件

Posted

技术标签:

【中文标题】使用 Java 合并 2 个 AAC 文件【英文标题】:Combine 2 AAC files using Java 【发布时间】:2012-09-25 00:54:04 【问题描述】:

我试图将 2 个 AAC 文件合并为一个,我发现在 AAC 文件中 - 标题元素一直存在到 FF8 字节,然后接下来的 4 个字节包含 AAC 数据的长度。我试着维护1个header数组,把2个AAC文件的大小相加,然后把两个文件的数据缓冲区一个接一个地加进去。

生成的文件只能播放第一个 AAC 文件的内容。下面是代码片段。

// First input: keep its leading 0xFF8 bytes, the 4-byte length field and the payload.
FileInputStream fs = new FileInputStream("./res/after.aac");
dis = new DataInputStream(fs);
int lengthTotal;
try {
    headerData = new byte[0xFF8];
    // readFully blocks until the array is full; a plain read() may stop short
    // and leave the tail of the buffer zeroed.
    dis.readFully(headerData);

    lengthTotal = dis.readInt();
    System.out.println("Length of After == "+lengthTotal);
    dis.readInt(); // skip the next 4 bytes; "mdat" is written in their place on output

    // NOTE(review): available() is documented as an estimate; it is kept here
    // because the snippet relies on it to size the payload buffer.
    data = new byte[dis.available()];
    dis.readFully(data);
} finally {
    dis.close(); // closing the wrapper also closes fs
    dis = null;
    fs = null;
}

// Second input: discard its leading 0xFF8 bytes, then read length and payload.
fs = new FileInputStream("./res/continue.aac");
dis = new DataInputStream(fs);
try {
    // skipBytes() may skip fewer bytes than asked; reading into a scratch
    // buffer guarantees exactly 0xFF8 bytes are consumed.
    dis.readFully(new byte[0xFF8]);

    int length = dis.readInt();
    System.out.println("Length of Ahead == "+length);
    // Both length fields are summed and 8 is subtracted once, since only one
    // 8-byte (length + "mdat") prefix is written to the output.
    lengthTotal = lengthTotal + length -8;
    System.out.println("Total Length== "+lengthTotal);
    dis.readInt();
    newData = new byte[dis.available()];
    dis.readFully(newData);
} finally {
    dis.close();
    dis = null;
    fs = null;
}

// Output: first file's leading bytes, combined length, "mdat", then both payloads.
FileOutputStream fos = new FileOutputStream("./res/combine.aac");
DataOutputStream dos = new DataOutputStream(fos);
try {
    dos.write(headerData);
    dos.writeInt(lengthTotal);
    dos.writeBytes("mdat");
    dos.write(data);
    dos.write(newData);
} finally {
    dos.close(); // flushes and closes fos as well
}

我知道在第 56 个字节中有关于 AAC 文件持续时间的信息,但我无法弄清楚。有人可以帮我吗?

【问题讨论】:

我也在尝试同样的方法...你解决了吗?有什么解决办法吗? 【参考方案1】:

我建议你看看jaad库中aac文件是如何解析的,特别有趣的是ADTS处理代码here和ADIF头解析here。

【讨论】:

【参考方案2】:

好吧,我不能告诉你你做错了什么。但我可以告诉你如何做你想做的事。

首先创建一组通用的辅助函数(General Helper Functions):

    /// <summary>Small general-purpose helpers.</summary>
    public static class General {
        /// <summary>
        /// Copies all of <paramref name="src"/> into <paramref name="dst"/>,
        /// starting at index <paramref name="dstOffset"/> of the destination.
        /// </summary>
        public static void CopyBytes(byte[] dst, int dstOffset, byte[] src) {
            Buffer.BlockCopy(src, 0, dst, dstOffset, src.Length);
        }
    }


/// <summary>
/// Bit-level read/write helpers. Bits are handled most-significant-bit first.
/// </summary>
public static class BitHelper {
    /// <summary>
    /// Takes the top <paramref name="length"/> bits off <paramref name="x"/>,
    /// returns them as an int, and shifts <paramref name="x"/> left by that amount.
    /// </summary>
    public static int Read(ref ulong x, int length) {
        int r = (int)(x >> (64 - length));
        x <<= length;
        return r;
    }

    /// <summary>
    /// Reads <paramref name="length"/> bits from <paramref name="bytes"/> starting at
    /// bit position <paramref name="offset"/>, then advances <paramref name="offset"/>
    /// by <paramref name="length"/>.
    /// </summary>
    public static int Read(byte[] bytes, ref int offset, int length) {
        int startByte = offset / 8;
        int endByte = (offset + length - 1) / 8;
        int skipBits = offset % 8;
        ulong bits = 0;
        // Load at most 8 bytes, first byte in the top 8 bits of the accumulator.
        for (int i = 0; i <= Math.Min(endByte - startByte, 7); i++) {
            bits |= (ulong)bytes[startByte + i] << (56 - (i * 8));
        }
        // Drop the bits of the first byte that precede the requested position.
        if (skipBits != 0) Read(ref bits, skipBits);
        offset += length;
        return Read(ref bits, length);
    }

    /// <summary>
    /// Shifts <paramref name="x"/> left by <paramref name="length"/> bits and places
    /// the low <paramref name="length"/> bits of <paramref name="value"/> in the gap.
    /// </summary>
    public static void Write(ref ulong x, int length, int value) {
        ulong mask = 0xFFFFFFFFFFFFFFFF >> (64 - length);
        x = (x << length) | ((ulong)value & mask);
    }

    /// <summary>
    /// Copies <paramref name="length"/> bits starting at bit position
    /// <paramref name="offset"/> into a new byte array aligned to bit 0 of its
    /// first byte. Unused low bits of the last byte are cleared.
    /// Returns an empty array when <paramref name="length"/> is 0.
    /// </summary>
    public static byte[] CopyBlock(byte[] bytes, int offset, int length) {
        // Without this guard the final masking step would index dst[-1].
        if (length == 0) return new byte[0];

        int startByte = offset / 8;
        int endByte = (offset + length - 1) / 8;
        int shiftA = offset % 8;
        int shiftB = 8 - shiftA;
        byte[] dst = new byte[(length + 7) / 8];
        if (shiftA == 0) {
            // Byte-aligned source: a straight copy is enough.
            Buffer.BlockCopy(bytes, startByte, dst, 0, dst.Length);
        }
        else {
            int i;
            // Each output byte is stitched from two neighbouring source bytes.
            for (i = 0; i < endByte - startByte; i++) {
                dst[i] = (byte)((bytes[startByte + i] << shiftA) | (bytes[startByte + i + 1] >> shiftB));
            }
            // A trailing output byte may be fed by the last source byte alone.
            if (i < dst.Length) {
                dst[i] = (byte)(bytes[startByte + i] << shiftA);
            }
        }
        // Zero the bits past the requested length in the last byte.
        dst[dst.Length - 1] &= (byte)(0xFF << ((dst.Length * 8) - length));
        return dst;
    }
}


/// <summary>
/// Big-endian conversions between unsigned integers and byte arrays
/// (most significant byte first).
/// </summary>
public static class BitConverterBE {
    /// <summary>Reads 8 bytes at <paramref name="startIndex"/> as a big-endian ulong.</summary>
    public static ulong ToUInt64(byte[] value, int startIndex) {
        return
            ((ulong)value[startIndex    ] << 56) |
            ((ulong)value[startIndex + 1] << 48) |
            ((ulong)value[startIndex + 2] << 40) |
            ((ulong)value[startIndex + 3] << 32) |
            ((ulong)value[startIndex + 4] << 24) |
            ((ulong)value[startIndex + 5] << 16) |
            ((ulong)value[startIndex + 6] <<  8) |
            ((ulong)value[startIndex + 7]      );
    }

    /// <summary>Reads 4 bytes at <paramref name="startIndex"/> as a big-endian uint.</summary>
    public static uint ToUInt32(byte[] value, int startIndex) {
        return
            ((uint)value[startIndex    ] << 24) |
            ((uint)value[startIndex + 1] << 16) |
            ((uint)value[startIndex + 2] <<  8) |
            ((uint)value[startIndex + 3]      );
    }

    /// <summary>Reads 2 bytes at <paramref name="startIndex"/> as a big-endian ushort.</summary>
    public static ushort ToUInt16(byte[] value, int startIndex) {
        return (ushort)(
            (value[startIndex    ] <<  8) |
            (value[startIndex + 1]      ));
    }

    /// <summary>Returns the 8 bytes of <paramref name="value"/>, most significant first.</summary>
    public static byte[] GetBytes(ulong value) {
        byte[] buff = new byte[8];
        buff[0] = (byte)(value >> 56);
        buff[1] = (byte)(value >> 48);
        buff[2] = (byte)(value >> 40);
        buff[3] = (byte)(value >> 32);
        buff[4] = (byte)(value >> 24);
        buff[5] = (byte)(value >> 16);
        buff[6] = (byte)(value >>  8);
        buff[7] = (byte)(value      );
        return buff;
    }

    /// <summary>Returns the 4 bytes of <paramref name="value"/>, most significant first.</summary>
    public static byte[] GetBytes(uint value) {
        byte[] buff = new byte[4];
        buff[0] = (byte)(value >> 24);
        buff[1] = (byte)(value >> 16);
        buff[2] = (byte)(value >>  8);
        buff[3] = (byte)(value      );
        return buff;
    }

    /// <summary>Returns the 2 bytes of <paramref name="value"/>, most significant first.</summary>
    public static byte[] GetBytes(ushort value) {
        byte[] buff = new byte[2];
        buff[0] = (byte)(value >>  8);
        buff[1] = (byte)(value      );
        return buff;
    }
}


/// <summary>
/// Little-endian conversions from unsigned integers to byte arrays
/// (least significant byte first).
/// </summary>
public static class BitConverterLE {
    /// <summary>Returns the 8 bytes of <paramref name="value"/>, least significant first.</summary>
    public static byte[] GetBytes(ulong value) {
        byte[] buff = new byte[8];
        buff[0] = (byte)(value      );
        buff[1] = (byte)(value >>  8);
        buff[2] = (byte)(value >> 16);
        buff[3] = (byte)(value >> 24);
        buff[4] = (byte)(value >> 32);
        buff[5] = (byte)(value >> 40);
        buff[6] = (byte)(value >> 48);
        buff[7] = (byte)(value >> 56);
        return buff;
    }

    /// <summary>Returns the 4 bytes of <paramref name="value"/>, least significant first.</summary>
    public static byte[] GetBytes(uint value) {
        byte[] buff = new byte[4];
        buff[0] = (byte)(value      );
        buff[1] = (byte)(value >>  8);
        buff[2] = (byte)(value >> 16);
        buff[3] = (byte)(value >> 24);
        return buff;
    }

    /// <summary>Returns the 2 bytes of <paramref name="value"/>, least significant first.</summary>
    public static byte[] GetBytes(ushort value) {
        byte[] buff = new byte[2];
        buff[0] = (byte)(value      );
        buff[1] = (byte)(value >>  8);
        return buff;
    }
}

现在实现 Audio Helper 类和接口:

    /// <summary>Sink that receives audio chunks and writes them to a file.</summary>
    interface IAudioWriter
    {
        /// <summary>Handles one chunk; <paramref name="timeStamp"/> accompanies the chunk.</summary>
        void WriteChunk(byte[] chunk, uint timeStamp);

        /// <summary>Signals that no more chunks will be written.</summary>
        void Finish();

        /// <summary>Path of the output file.</summary>
        string Path { get; }
    }


    /// <summary>
    /// Writes AAC audio chunks to a file, prefixing each audio chunk with a
    /// 7-byte ADTS header built from the most recently seen header chunk.
    /// </summary>
    class AACWriter : IAudioWriter
    {
        string _path;
        FileStream _fs;
        int _aacProfile;
        int _sampleRateIndex;
        int _channelConfig;

        /// <summary>Creates (or truncates) the output file at <paramref name="path"/>.</summary>
        public AACWriter(string path) {
            _path = path;
            _fs = new FileStream(path, FileMode.Create, FileAccess.Write, FileShare.Read, 65536);
        }

        /// <summary>
        /// Processes one chunk. A chunk whose first byte is 0 is a header: the
        /// profile, sample-rate index and channel configuration are parsed from
        /// its next two bytes and remembered. Any other chunk is audio data: an
        /// ADTS header plus the chunk payload (everything after the first byte)
        /// is appended to the file. <paramref name="timeStamp"/> is not used.
        /// </summary>
        /// <exception cref="Exception">
        /// The header carries unsupported values, or an audio frame is too large
        /// for the 13-bit ADTS frame-length field.
        /// </exception>
        public void WriteChunk(byte[] chunk, uint timeStamp)
        {
            if (chunk.Length < 1) return;

            if (chunk[0] == 0) { // Header
                if (chunk.Length < 3) return;

                // Put the two configuration bytes in the top 16 bits so that
                // BitHelper.Read can consume them from the most significant end.
                ulong bits = (ulong)BitConverterBE.ToUInt16(chunk, 1) << 48;

                _aacProfile = BitHelper.Read(ref bits, 5) - 1;
                _sampleRateIndex = BitHelper.Read(ref bits, 4);
                _channelConfig = BitHelper.Read(ref bits, 4);

                if ((_aacProfile < 0) || (_aacProfile > 3))
                    throw new Exception("Unsupported AAC profile.");
                if (_sampleRateIndex > 12)
                    throw new Exception("Invalid AAC sample rate index.");
                if (_channelConfig > 6)
                    throw new Exception("Invalid AAC channel configuration.");
            }
            else { // Audio data
                int dataSize = chunk.Length - 1;
                int frameLength = 7 + dataSize;
                // The length field is 13 bits wide; a larger value would be
                // silently truncated by the mask in BitHelper.Write.
                if (frameLength > 0x1FFF)
                    throw new Exception("AAC frame too large for ADTS header.");

                ulong bits = 0;

                // Reference: WriteADTSHeader from FAAC's bitstream.c
                // Field widths below add up to 56 bits (7 bytes).

                BitHelper.Write(ref bits, 12, 0xFFF);            // syncword
                BitHelper.Write(ref bits,  1, 0);                // ID
                BitHelper.Write(ref bits,  2, 0);                // layer
                BitHelper.Write(ref bits,  1, 1);                // protection absent
                BitHelper.Write(ref bits,  2, _aacProfile);      // profile
                BitHelper.Write(ref bits,  4, _sampleRateIndex); // sampling frequency index
                BitHelper.Write(ref bits,  1, 0);                // private bit
                BitHelper.Write(ref bits,  3, _channelConfig);   // channel configuration
                BitHelper.Write(ref bits,  1, 0);                // original/copy
                BitHelper.Write(ref bits,  1, 0);                // home
                BitHelper.Write(ref bits,  1, 0);                // copyright id bit
                BitHelper.Write(ref bits,  1, 0);                // copyright id start
                BitHelper.Write(ref bits, 13, frameLength);      // frame length (header + payload)
                BitHelper.Write(ref bits, 11, 0x7FF);            // buffer fullness
                BitHelper.Write(ref bits,  2, 0);                // raw data blocks in frame

                // The 56 header bits sit in the low 7 bytes of the 8-byte value,
                // so the first big-endian byte is skipped.
                _fs.Write(BitConverterBE.GetBytes(bits), 1, 7);
                _fs.Write(chunk, 1, dataSize);
            }
        }

        /// <summary>Closes the output file.</summary>
        public void Finish() {
            _fs.Close();
        }

        /// <summary>Path the writer was created with.</summary>
        public string Path {
            get {
                return _path;
            }
        }
    }

现在你需要自己做的是,从第一个 AAC 文件中逐个读取块并写入它们,然后从第二个 AAC 文件中逐个读取块并将它们附加到中间文件。

注意,上面的代码是 C#,而 Java 没有 ref 参数,所以你必须用包装类(wrapper)来模拟 C# 的 ref 效果,只需将:

ref Type variable_name

替换为:

_<Type> variable_name

【讨论】:

即使这样仍然不够,因为有一堆 MPEG4 元数据(如 stsz 样本大小表)必须智能组合。 您的建议属于 MP4 容器的范围。每个块中的ADTSHeader 为解码器提供了足够的信息以正确解码音频,即 AAC 原始文件。 @duskwuff 示例代码中对"mdat"的引用让我觉得它实际上是一个扩展名错误的MPEG4。

以上是关于使用 Java 合并 2 个 AAC 文件的主要内容,如果未能解决你的问题,请参考以下文章

FFmpeg 命令行工具ffmpeg

合并iPhone上的音频文件

2020-03-11 FFmpeg——mp4合并中的坑

Java - 合并超过 2 个 .wav 文件时遇到问题

如何使用Java将> 1000个xml文件合并为一个

java编程将若干个excel文件合并成一个csv文件,文件变大的很多,怎么解决