1.变量初始化 申明的成员变量在构造方法内初始化,这些常量值是从解码规范的文档里直接COPY过来的。
2.帧的数据结构 以Layer2编码的文件按帧存放,解码时也是逐帧解码。每一帧内依次存放位分配信息、增益因子选择信息、增益因子、主数据。采用标准立体声编码的Layer2一帧内的主数据有12个粒度组(granule),一个粒度组内最多可有32个子带(subband),每个子带两个声道。每个声道内3组样本值连续存放,每一组32个值。
3.解码过程 Layer2编码不采用心理声学模型,解码端不用IMDCT;Layer2编码端没有哈夫曼编码。逆量化没有采用解码Layer3那样的查表法而是直接运算,Layer2的逆量化公式也比Layer3的简单得多。解码一帧Layer2只需6步,这6个步骤在decodeFrame方法内注解出来,每一步的细节一看就懂,不再赘述。解码Layer2的源码如下:
/* * Layer2.java -- MPEG 1.0/2.0/2.5 Audio Layer II Decoder * Copyright (C) 2010 * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program. If not, see <http://www.gnu.org/licenses/>. * * If you would like to negotiate alternate licensing terms, you may do * so by contacting the author: <http://jmp123.sf.net/> */ package decoder; public final class Layer2 implements ILayer123 { private static Header header; private static BitStream bs; private static Synthesis filter; private static int nch, aidx, sblimit; private static byte[][] allocation; //[2][32] private static byte[][] nbal; //[5][] private static byte[][] sbquant_offset; //[5][] private static byte[][] scfsi; //[2][32] private static byte[][][] scalefactor; //[2][32][3] private static int[] cq_steps; //[17] private static float[] cq_C; //[17] private static float[] cq_D; //[17] private static byte[] cq_bits; //[17] private static byte[] bitalloc_offset; //[8] private static byte[][] offset_table; //[6][15] private static byte[] group; //[17] private static int[] samplecode; //[3] private static float[][][] syin; //[2][3][32] // Layer1也用到factor[] public static float[] factor; //[63] public Layer2(BitStream bitstream,Header h, Synthesis filter, int wch) { header = h; bs = bitstream; this.filter = filter; nbal = new byte[5][]; // ISO/IEC 11172-3 Table 3-B.2a nbal[0] = new byte[] { 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2 }; // ISO/IEC 11172-3 Table 3-B.2b nbal[1] = new byte[] { 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2 }; // ISO/IEC 11172-3 Table 3-B.2c nbal[2] = new byte[] { 4, 4, 3, 3, 3, 3, 3, 3 }; // ISO/IEC 11172-3 Table 3-B.2d nbal[3] = new byte[] { 4, 4, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3 }; // ISO/IEC 13818-3 Table B.1 nbal[4] = new byte[] { 4, 4, 4, 4, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2 }; // ISO/IEC 11172-3 Table 3-B.1 factor = new float[] {2.00000000000000f, 1.58740105196820f, 1.25992104989487f, 1.00000000000000f, 0.79370052598410f, 0.62996052494744f, 0.50000000000000f, 0.39685026299205f, 0.31498026247372f, 0.25000000000000f, 0.19842513149602f, 0.15749013123686f, 0.12500000000000f, 0.09921256574801f, 0.07874506561843f, 0.06250000000000f, 0.04960628287401f, 0.03937253280921f, 0.03125000000000f, 0.02480314143700f, 0.01968626640461f, 0.01562500000000f, 0.01240157071850f, 0.00984313320230f, 0.00781250000000f, 0.00620078535925f, 0.00492156660115f, 0.00390625000000f, 0.00310039267963f, 0.00246078330058f, 0.00195312500000f, 0.00155019633981f, 0.00123039165029f, 0.00097656250000f, 0.00077509816991f, 0.00061519582514f, 0.00048828125000f, 0.00038754908495f, 0.00030759791257f, 0.00024414062500f, 0.00019377454248f, 0.00015379895629f, 0.00012207031250f, 0.00009688727124f, 0.00007689947814f, 0.00006103515625f, 0.00004844363562f, 0.00003844973907f, 0.00003051757813f, 0.00002422181781f, 0.00001922486954f, 0.00001525878906f, 0.00001211090890f, 0.00000961243477f, 0.00000762939453f, 0.00000605545445f, 0.00000480621738f, 0.00000381469727f, 0.00000302772723f, 0.00000240310869f, 0.00000190734863f, 0.00000151386361f, 0.00000120155435f }; // cq_xxx: Layer II classes of quantization, ISO/IEC 11172-3 Table 3-B.4 cq_steps = new int[] { 3, 5, 7, 9, 15, 31, 63, 127, 255, 511, 1023, 2047, 4095, 8191, 16383, 32767, 65535 }; cq_C = new float[] { 1.3333333f, 1.6f, 1.1428571f, 1.77777778f, 1.0666667f, 1.0322581f, 1.015873f, 1.007874f, 1.0039216f, 1.0019569f, 1.0009775f, 1.0004885f, 1.0002442f, 1.000122f, 1.000061f, 1.0000305f, 1.00001525902f }; cq_D = new float[] { 0.5f, 0.5f, 0.25f, 0.5f, 0.125f, 0.0625f, 0.03125f, 0.015625f, 0.0078125f, 0.00390625f, 0.001953125f, 0.0009765625f, 0.00048828125f, 0.00024414063f, 0.00012207031f, 0.00006103516f, 0.00003051758f }; cq_bits = new byte[] {5,7,3,10,4,5,6,7,8,9,10,11,12,13,14,15,16}; sbquant_offset = new byte[][] { // ISO/IEC 11172-3 Table 3-B.2a {7,7,7,6,6,6,6,6,6,6,6,3,3,3,3,3,3,3,3,3, 3,3,3,0,0,0,0}, // ISO/IEC 11172-3 Table 3-B.2b {7,7,7,6,6,6,6,6,6,6,6,3,3,3,3,3,3,3,3,3, 3,3,3,0,0,0,0,0,0,0}, // ISO/IEC 11172-3 Table 3-B.2c {5,5,2,2,2,2,2,2}, // ISO/IEC 11172-3 Table 3-B.2d {5,5,2,2,2,2,2,2,2,2,2,2}, // ISO/IEC 13818-3 Table B.1 {4,4,4,4,2,2,2,2,2,2,2,1,1,1,1,1,1,1,1,1, 1,1,1,1,1,1,1,1,1,1} }; bitalloc_offset = new byte[] { 0, 3, 3, 1, 2, 3, 4, 5 }; offset_table = new byte[][] { { 0, 1, 16 }, { 0, 1, 2, 3, 4, 5, 16 }, { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14 }, { 0, 1, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 }, { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 16 }, { 0, 2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16 } }; group = new byte[] { 2, 3, 0, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }; allocation = new byte[2][32]; scfsi = new byte[2][32]; scalefactor = new byte[2][32][3]; samplecode = new int[3]; syin = new float[2][3][32]; //nch,aidx,sblimit... nch = header.getChannels(); int bitrate = header.getBitrate() / nch; if(header.getVersion() == Header.MPEG1) if(bitrate <= 48) aidx = (bitrate == 32) ? 3 : 2; else if(bitrate <= 80) aidx = 0; else aidx = (bitrate == 48) ? 0 : 1; else //mpeg 2.0/2.5 aidx = 4; byte[] limit = {27, 30, 8, 12, 30}; sblimit = limit[aidx]; } private void requantization(int index, int gr, int ch, int sb) { int nb, s, c; int nlevels = cq_steps[index]; if ((nb = group[index]) != 0) { // degrouping c = bs.getBits17(cq_bits[index]); for (s = 0; s < 3; s++) { samplecode[s] = c % nlevels; c /= nlevels; } nlevels = (1 << nb) - 1; //用于计算fractional } else { nb = cq_bits[index]; for (s = 0; s < 3; s++) samplecode[s] = bs.getBits17(nb); } for (s = 0; s < 3; s++) { float fractional = 2.0f * samplecode[s] / (nlevels + 1) - 1.0f; // s'' = C * (s''' + D) syin[ch][s][sb] = cq_C[index] * (fractional + cq_D[index]); // s' = factor * s'' syin[ch][s][sb] *= factor[scalefactor[ch][sb][gr >> 2]]; } } private void stereo(int index, int gr, int sb) { int nb, s, c; int nlevels = cq_steps[index]; if ((nb = group[index]) != 0) { c = bs.getBits17(cq_bits[index]); for (s = 0; s < 3; s++) { samplecode[s] = c % nlevels; c /= nlevels; } nlevels = (1 << nb) - 1; } else { nb = cq_bits[index]; for (s = 0; s < 3; s++) samplecode[s] = bs.getBits17(nb); } for (s = 0; s < 3; s++) { float fractional = 2.0f * samplecode[s] / (nlevels + 1) - 1.0f; // s'' = C * (s''' + D) syin[0][s][sb] = syin[1][s][sb] = cq_C[index] * (fractional + cq_D[index]); // s' = factor * s'' syin[0][s][sb] *= factor[scalefactor[0][sb][gr >> 2]]; syin[1][s][sb] *= factor[scalefactor[1][sb][gr >> 2]]; } } public void decodeFrame() throws Exception { int maindata_begin ,bound, sb, ch; int slots = header.getMainDataSlots(); bs.append(slots); maindata_begin = bs.getBytePos(); bound = (header.getMode() == 1) ? ((header.getModeExtension() + 1) * 4) : 32; if(bound > sblimit) bound = sblimit; /* * 1. Bit allocation decoding */ for (sb = 0; sb < bound; sb++) for (ch = 0; ch < nch; ch++) allocation[ch][sb] = (byte)bs.getBits9(nbal[aidx][sb]); // 2..4 bits for (sb = bound; sb < sblimit; sb++) allocation[1][sb] = allocation[0][sb] = (byte)bs.getBits9(nbal[aidx][sb]); /* * 2. Scalefactor selection information decoding */ for (sb = 0; sb < sblimit; sb++) for (ch = 0; ch < nch; ch++) if (allocation[ch][sb] != 0) scfsi[ch][sb] = (byte)bs.getBits9(2); else scfsi[ch][sb] = 0; /* * 3. Scalefactor decoding */ for (sb = 0; sb < sblimit; ++sb) for (ch = 0; ch < nch; ++ch) if (allocation[ch][sb] != 0) { scalefactor[ch][sb][0] = (byte)bs.getBits9(6); switch (scfsi[ch][sb]) { case 2: scalefactor[ch][sb][2] = scalefactor[ch][sb][1] = scalefactor[ch][sb][0]; break; case 0: scalefactor[ch][sb][1] = (byte)bs.getBits9(6); case 1: case 3: scalefactor[ch][sb][2] = (byte)bs.getBits9(6); } if ((scfsi[ch][sb] & 1) == 1) scalefactor[ch][sb][1] = scalefactor[ch][sb][scfsi[ch][sb] - 1]; } int gr, index, s; for (gr = 0; gr < 12; gr++) { /* * 4. Requantization of subband samples */ for (sb = 0; sb < bound; sb++) for (ch = 0; ch < nch; ch++) if ((index = allocation[ch][sb]) != 0) { index = offset_table[bitalloc_offset[sbquant_offset[aidx][sb]]][index - 1]; requantization(index, gr, ch, sb); } else syin[ch][0][sb] = syin[ch][1][sb] = syin[ch][2][sb] = 0; //mode=1(Joint Stereo) for (sb = bound; sb < sblimit; sb++) if ((index = allocation[0][sb]) != 0) { index = offset_table[bitalloc_offset[sbquant_offset[aidx][sb]]][index - 1]; stereo(index, gr, sb); } else for (ch = 0; ch < nch; ch++) syin[ch][0][sb] = syin[ch][1][sb] = syin[ch][2][sb] = 0; for (ch = 0; ch < nch; ch++) for (s = 0; s < 3; s++) for (sb = sblimit; sb < 32; sb++) syin[ch][s][sb] = 0; /* * 5. Synthesis subband filter */ for (ch = 0; ch < nch; ch++) for (s = 0; s < 3; s++) filter.synthesisSubBand(syin[ch][s], ch); } // for gr=0 to 12 /* * 6. Ancillary bits */ int discard = slots + maindata_begin - bs.getBytePos(); bs.skipBytes(discard); } }