Context Navigation

← Previous Change
Next Change →

Changeset 1130 for OniSplit/Sound

Timestamp:

May 28, 2020, 11:28:44 PM (5 years ago)

Author:

geyser

Message:

Minor fixes and features in SNDD export: "transcoding" forbidden, standard-compliant MSADPCM (with padding and "fact" section), PCM export (with -extract:pcm).

Location:

OniSplit/Sound

Files:

: 3 edited

AifExporter.cs (modified) (1 diff)
SoundData.cs (modified) (2 diffs)
WavExporter.cs (modified) (4 diffs)

Legend:

: Unmodified
: Added
: Removed

OniSplit/Sound/AifExporter.cs

-              r1114
+              r1130
             using (var writer = new BinaryWriter(stream))
+            {
+                if (!(sound.IsIMA4))
+                {
+                    throw new NotSupportedException("Transcoding from PC ADPCM to Mac/demo ADPCM not supported!");
+                }
                 writer.Write(Utils.ByteSwap(fcc_FORM));
                 writer.Write(Utils.ByteSwap(50 + sound.Data.Length));

OniSplit/Sound/SoundData.cs

-              r1114
+              r1130
     internal class SoundData
+    {
+        public bool IsIMA4;
         public int SampleRate;
         public int ChannelCount;
 …
                     sound.SampleRate = 22050;
                     reader.Skip(4);
+                    sound.IsIMA4 = true;
+                }
                 else
+                {
                     reader.Skip(6);
+                    reader.Skip(6); // ADPCM format identifiers (change to support PCM?)
                     sound.ChannelCount = reader.ReadInt16();
                     sound.SampleRate = reader.ReadInt32();
                     reader.Skip(44);
+                    sound.IsIMA4 = false;
+                }

OniSplit/Sound/WavExporter.cs

-              r1126
+              r1130
+    {
         #region Private data
+        private bool convert_to_PCM;
         private const int fcc_RIFF = 0x46464952;
         private const int fcc_WAVE = 0x45564157;
         private const int fcc_fmt = 0x20746d66;
+        private const int fcc_fact = 0x74636166;
         private const int fcc_data = 0x61746164;
         private static readonly byte[] formatTemplate = new byte[50]
+        {
 x02, 0,    // format ID (always 2)
+        private static readonly byte[] formatTemplate_ADPCM = new byte[50]
+        {
+x02, 0,    // format ID (2 for ADPCM)
 , 0,       // ChannelCount (overwritten)
 x22, 0x56, 0, 0, // SampleRate (usually 22050, can be 44100)
 …
 , 0x02,    // block alignment (default 512, can be 1024)
 x04, 0,    // bits per sample (always 4)
 x20, 0,    // size of extended header block
+x20, 0,    // size of extended ADPCM header block
 xf4, 0x03, // samples per block (usually 1012, can be 2036)
 x07, 0,    // standard ADPCM coefficient table (always the same)
 …
         };
+        private static readonly byte[] formatTemplate_PCM = new byte[16]
+        {
+x01, 0,    // format ID (1 for linear PCM)
+, 0,       // ChannelCount (overwritten)
+x22, 0x56, 0, 0, // SampleRate (usually 22050, can be 44100)
+, 0, 0, 0, // data rate in bytes/s (computed and overwritten)
+x02, 0,    // block size (2 bytes for mono, 4 for stereo)
+x10, 0     // bits per sample (always 16)
+        };
+        private static readonly byte[] factTemplate = new byte[4]
+        {
+, 0, 0, 0  // sample count (computed and overwritten)
+        };
+        private static readonly int[] ima_index_table = new int[16]
+        {
+           -1, -1, -1, -1, 2, 4, 6, 8,
+           -1, -1, -1, -1, 2, 4, 6, 8
+        };
+        private static readonly int[] ima_step_table = new int[89]
+        {
+, 8, 9, 10, 11, 12, 13, 14, 16, 17,
+, 21, 23, 25, 28, 31, 34, 37, 41, 45,
+, 55, 60, 66, 73, 80, 88, 97, 107, 118,
+, 143, 157, 173, 190, 209, 230, 253, 279, 307,
+, 371, 408, 449, 494, 544, 598, 658, 724, 796,
+, 963, 1060, 1166, 1282, 1411, 1552, 1707, 1878, 2066,
+, 2499, 2749, 3024, 3327, 3660, 4026, 4428, 4871, 5358,
+, 6484, 7132, 7845, 8630, 9493, 10442, 11487, 12635, 13899,
+, 16818, 18500, 20350, 22385, 24623, 27086, 29794, 32767
+        };
+        private static readonly int[] msadpcm_adapt_table = new int[16]
+        {
+, 230, 230, 230, 307, 409, 512, 614,
+, 614, 512, 409, 307, 230, 230, 230
+        };
+        private static readonly int[] msadpcm_coeff_table1 = new int[7]
+        {
+, 512, 0, 192, 240, 460, 392
+        };
+        private static readonly int[] msadpcm_coeff_table2 = new int[7]
+        {
+, -256, 0, 64, 0, -208, -232
+        };
         #endregion
         public WavExporter(InstanceFileManager fileManager, string outputDirPath)
+        public WavExporter(InstanceFileManager fileManager, string outputDirPath, bool convertToPCM = false)
             : base(fileManager, outputDirPath)
+        {
+            convert_to_PCM = convertToPCM;
+        }
+        private static void ClampToRange(ref int value, int lower, int upper)
+        {
+            if (value > upper)
+                value = upper;
+            if (value < lower)
+                value = lower;
+        }
+        protected Int16 NibbletoSampleIMA4(ref int predictor, ref int step_index, Byte nibble)
+        {
+            int step = ima_step_table[step_index];
+            step_index += ima_index_table[nibble];
+            ClampToRange(ref step_index, 0, 88);
+            int diff = step >> 3;
+            if ((nibble & 0x04) != 0) diff +=  step;
+            if ((nibble & 0x02) != 0) diff += (step >> 1);
+            if ((nibble & 0x01) != 0) diff += (step >> 2);
+            if ((nibble & 0x08) != 0)
+                predictor -= diff;
+            else
+                predictor += diff;
+            ClampToRange(ref predictor, -32768, 32767);
+            return (Int16)predictor;
+        }
+        protected Int16 NibbletoSampleMSADPCM(ref Int16 sample1, ref Int16 sample2, ref UInt16 delta, Byte pred_index, Byte nibble)
+        {
+            int coeff1 = msadpcm_coeff_table1[pred_index];
+            int coeff2 = msadpcm_coeff_table2[pred_index];
+            int prediction = ((int)sample1 * (int)coeff1 + (int)sample2 * (int)coeff2) >> 8;
+            int snibble = (nibble < 8) ? nibble : (nibble - 16);
+            int correction = snibble * (int)delta;
+            int sample = prediction + correction;
+            ClampToRange(ref sample, -32768, 32767);
+            sample2 = sample1;
+            sample1 = (Int16)sample;
+            int newDelta = delta * msadpcm_adapt_table[nibble];
+            newDelta >>= 8;
+            ClampToRange(ref newDelta, 16, 65535);
+            delta = (UInt16)newDelta;
+            return (Int16)sample;
+        }
 …
             using (var writer = new BinaryWriter(stream))
+            {
+                var format = (byte[])formatTemplate.Clone();
+                var blockAlignment = 512 * sound.ChannelCount * sound.SampleRate / 22050;
+                var samplesPerBlock = 2 + (blockAlignment - sound.ChannelCount * 7) * 8 / sound.ChannelCount / 4;
+                var averageRate = sound.SampleRate * blockAlignment / samplesPerBlock;
+                Array.Copy(BitConverter.GetBytes(sound.ChannelCount), 0, format, 2, 2);
+                Array.Copy(BitConverter.GetBytes(sound.SampleRate), 0, format, 4, 4);
+                Array.Copy(BitConverter.GetBytes(averageRate), 0, format, 8, 4);
+                Array.Copy(BitConverter.GetBytes(blockAlignment), 0, format, 12, 2);
+                Array.Copy(BitConverter.GetBytes(samplesPerBlock), 0, format, 18, 2);
+                writer.Write(fcc_RIFF);
+                writer.Write(8 + format.Length + 8 + sound.Data.Length);
+                writer.Write(fcc_WAVE);
+                //
+                // write format chunk
+                //
+                writer.Write(fcc_fmt);
+                writer.Write(format.Length);
+                writer.Write(format);
+                //
+                // write data chunk
+                //
+                writer.Write(fcc_data);
+                writer.Write(sound.Data.Length);
+                writer.Write(sound.Data);
+                var blockSizeADPCM = 512 * sound.ChannelCount * sound.SampleRate / 22050;
+                int wholeBlocks = sound.Data.Length / blockSizeADPCM;
+                int leftoverBytes = sound.Data.Length - (wholeBlocks * blockSizeADPCM);
+                int leftoverSamples = 8 * (leftoverBytes - 7 * sound.ChannelCount)
+                                      / 4 / sound.ChannelCount + 2; // 4 bits per sample
+                int paddingBytes = 0;
+                if (leftoverBytes > 0) // incomplete trailing block
+                    paddingBytes = blockSizeADPCM - leftoverBytes;
+                var samplesPerBlock = 2 + (blockSizeADPCM - sound.ChannelCount * 7) * 8 / sound.ChannelCount / 4;
+                Int32 sampleCount = sampleCount = wholeBlocks * samplesPerBlock + leftoverSamples;
+                if (sound.IsIMA4) // IMA4 ADPCM format
+                {
+                    blockSizeADPCM = 34 * sound.ChannelCount;
+                    samplesPerBlock = 64;
+                    sampleCount = (sound.Data.Length / blockSizeADPCM) * samplesPerBlock;
+                }
+                if (!convert_to_PCM)
+                {
+                    if (sound.IsIMA4)
+                    {
+                        throw new NotSupportedException("Transcoding from Mac/demo ADPCM to PC ADPCM not supported! Please use -extract:pcm");
+                    }
+                    var format = (byte[])formatTemplate_ADPCM.Clone();
+                    var fact = (byte[])factTemplate.Clone(); // needed for ADPCM (to specify the actual sample count)
+                    var averageRate = sound.SampleRate * blockSizeADPCM / samplesPerBlock;
+                    Array.Copy(BitConverter.GetBytes(sound.ChannelCount), 0, format, 2, 2);
+                    Array.Copy(BitConverter.GetBytes(sound.SampleRate), 0, format, 4, 4);
+                    Array.Copy(BitConverter.GetBytes(averageRate), 0, format, 8, 4);
+                    Array.Copy(BitConverter.GetBytes(blockSizeADPCM), 0, format, 12, 2);
+                    Array.Copy(BitConverter.GetBytes(samplesPerBlock), 0, format, 18, 2);
+                    Array.Copy(BitConverter.GetBytes(sampleCount), 0, fact, 0, 4);
+                    writer.Write(fcc_RIFF);
+                    writer.Write(8 + format.Length + 8 + fact.Length + 8 + sound.Data.Length + paddingBytes);
+                    writer.Write(fcc_WAVE);
+                    //
+                    // write format chunk
+                    //
+                    writer.Write(fcc_fmt);
+                    writer.Write(format.Length);
+                    writer.Write(format);
+                    //
+                    // write fact chunk
+                    //
+                    writer.Write(fcc_fact);
+                    writer.Write(fact.Length);
+                    writer.Write(fact);
+                    //
+                    // write data chunk
+                    //
+                    writer.Write(fcc_data);
+                    writer.Write(sound.Data.Length + paddingBytes);
+                    writer.Write(sound.Data);
+                    Byte c = 0;
+                    for (int i = 0; i < paddingBytes; i++)
+                        writer.Write(c);
+                }
+                else
+                {
+                    var format = (byte[])formatTemplate_PCM.Clone();
+                    var blockSizePCM = 2 * sound.ChannelCount; // 16-bit samples or sample pairs
+                    samplesPerBlock = 2;
+                    var averageRate = sound.SampleRate * blockSizePCM / samplesPerBlock;
+                    Array.Copy(BitConverter.GetBytes(sound.ChannelCount), 0, format, 2, 2);
+                    Array.Copy(BitConverter.GetBytes(sound.SampleRate), 0, format, 4, 4);
+                    Array.Copy(BitConverter.GetBytes(averageRate), 0, format, 8, 4);
+                    Array.Copy(BitConverter.GetBytes(blockSizePCM), 0, format, 12, 2);
+                    int dataSize = blockSizePCM * sampleCount;
+                    writer.Write(fcc_RIFF);
+                    writer.Write(8 + format.Length + 8 + dataSize);
+                    writer.Write(fcc_WAVE);
+                    //
+                    // write format chunk
+                    //
+                    writer.Write(fcc_fmt);
+                    writer.Write(format.Length);
+                    writer.Write(format);
+                    //
+                    // write data chunk
+                    //
+                    var samplesL = new Int16[sampleCount];
+                    var samplesR = new Int16[sampleCount];
+                    if (sound.IsIMA4) // decode IMA4 into linear signed 16-bit PCM
+                    {
+                        int pos = 0;
+                        int iSampleL = 0;
+                        int predictorL = 0;
+                        int stepIndexL = 0;
+                        int iSampleR = 0;
+                        int predictorR = 0;
+                        int stepIndexR = 0;
+                        int nBlocks = sound.Data.Length / blockSizeADPCM;
+                        for (int block = 0; block < nBlocks; block++)
+                        {
+                            byte headerHiL = sound.Data[pos++];
+                            byte headerLoL = sound.Data[pos++];
+                            if (block == 0) // non-standard decoding: predictor initialization ignored after start
+                            {
+                                predictorL = ((((headerHiL << 1) | (headerLoL >> 7))) << 7);
+                                if (predictorL > 32767) predictorL -= 65536;
+                            }
+                            stepIndexL = headerLoL & 0x7f;
+                            for (int b = 0; b < 32; b++)
+                            {
+                                Byte nibblesL = sound.Data[pos++];
+                                Byte nibbleHiL = (Byte)(nibblesL >> 4);
+                                Byte nibbleLoL = (Byte)(nibblesL & 0xF);
+                                samplesL[iSampleL++] = NibbletoSampleIMA4(ref predictorL, ref stepIndexL, nibbleLoL);
+                                samplesL[iSampleL++] = NibbletoSampleIMA4(ref predictorL, ref stepIndexL, nibbleHiL);
+                            }
+                            if (sound.ChannelCount == 2)
+                            {
+                                byte headerHiR = sound.Data[pos++];
+                                byte headerLoR = sound.Data[pos++];
+                                if (block == 0) // non-standard decoding: predictor initialization ignored after start
+                                {
+                                    predictorR = ((((headerHiR << 1) | (headerLoR >> 7))) << 7);
+                                    if (predictorR > 32767) predictorR -= 65536;
+                                }
+                                stepIndexR = headerLoR & 0x7f;
+                                for (int b = 0; b < 32; b++)
+                                {
+                                    Byte nibblesR = sound.Data[pos++];
+                                    Byte nibbleHiR = (Byte)(nibblesR >> 4);
+                                    Byte nibbleLoR = (Byte)(nibblesR & 0xF);
+                                    samplesR[iSampleR++] = NibbletoSampleIMA4(ref predictorR, ref stepIndexR, nibbleLoR);
+                                    samplesR[iSampleR++] = NibbletoSampleIMA4(ref predictorR, ref stepIndexR, nibbleHiR);
+                                }
+                            }
+                        }
+                    }
+                    else // decode MSADPCM into linear signed 16-bit PCM
+                    {
+                        int pos = 0;
+                        Byte pred_indexL = 0, pred_indexR = 0;
+                        UInt16 deltaL = 0, deltaR = 0;
+                        int iSampleL = 0;
+                        int iSampleR = 0;
+                        Int16 sample1L = 0, sample2L = 0;
+                        Int16 sample1R = 0, sample2R = 0;
+                        while (pos < sound.Data.Length)
+                        {
+                            if ((pos % blockSizeADPCM) == 0) // read block header
+                            {
+                                pred_indexL = sound.Data[pos++];
+                                if (sound.ChannelCount == 2)
+                                    pred_indexR = sound.Data[pos++];
+                                Byte deltaLo = sound.Data[pos++];
+                                Byte deltaHi = sound.Data[pos++];
+                                deltaL = (UInt16)(deltaLo + 256 * deltaHi);
+                                if (sound.ChannelCount == 2)
+                                {
+                                    deltaLo = sound.Data[pos++];
+                                    deltaHi = sound.Data[pos++];
+                                    deltaR = (UInt16)(deltaLo + 256 * deltaHi);
+                                }
+                                Byte sampleLo = sound.Data[pos++];
+                                Byte sampleHi = sound.Data[pos++];
+                                UInt16 usample = (UInt16)(sampleLo + 256 * sampleHi);
+                                sample1L = (Int16)((usample < 32767) ? usample : (usample - 65536));
+                                if (sound.ChannelCount == 2)
+                                {
+                                    sampleLo = sound.Data[pos++];
+                                    sampleHi = sound.Data[pos++];
+                                    usample = (UInt16)(sampleLo + 256 * sampleHi);
+                                    sample1R = (Int16)((usample < 32767) ? usample : (usample - 65536));
+                                }
+                                sampleLo = sound.Data[pos++];
+                                sampleHi = sound.Data[pos++];
+                                usample = (UInt16)(sampleLo + 256 * sampleHi);
+                                sample2L = (Int16)((usample < 32767) ? usample : (usample - 65536));
+                                if (sound.ChannelCount == 2)
+                                {
+                                    sampleLo = sound.Data[pos++];
+                                    sampleHi = sound.Data[pos++];
+                                    usample = (UInt16)(sampleLo + 256 * sampleHi);
+                                    sample2R = (Int16)((usample < 32767) ? usample : (usample - 65536));
+                                }
+                                samplesL[iSampleL++] = sample2L;
+                                samplesL[iSampleL++] = sample1L;
+                                if (sound.ChannelCount == 2)
+                                {
+                                    samplesR[iSampleR++] = sample2R;
+                                    samplesR[iSampleR++] = sample1R;
+                                }
+                            }
+                            // read pair of nibbles
+                            Byte nibbles = sound.Data[pos++];
+                            Byte nibbleHi = (Byte)(nibbles >> 4);
+                            Byte nibbleLo = (Byte)(nibbles & 0xF);
+                            samplesL[iSampleL++] = NibbletoSampleMSADPCM(ref sample1L, ref sample2L, ref deltaL, pred_indexL, nibbleHi);
+                            if (sound.ChannelCount == 2)
+                                samplesR[iSampleR++] = NibbletoSampleMSADPCM(ref sample1R, ref sample2R, ref deltaR, pred_indexR, nibbleLo);
+                            else
+                                samplesL[iSampleL++] = NibbletoSampleMSADPCM(ref sample1L, ref sample2L, ref deltaL, pred_indexL, nibbleLo);
+                        }
+                    }
+                    writer.Write(fcc_data);
+                    writer.Write(dataSize);
+                    for (int smp = 0; smp < sampleCount; smp++)
+                    {
+                        writer.Write(samplesL[smp]);
+                        if(sound.ChannelCount == 2)
+                            writer.Write(samplesR[smp]);
+                    }
+                }
+            }
+        }

Note: See TracChangeset for help on using the changeset viewer.