MP3Loader.cpp 37 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871
  1. /*
  2. * Copyright (c) 2021, Arne Elster <arne@elster.li>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include "MP3Loader.h"
  7. #include "MP3HuffmanTables.h"
  8. #include "MP3Tables.h"
  9. #include "MP3Types.h"
  10. #include <AK/FixedArray.h>
  11. #include <LibCore/File.h>
  12. namespace Audio {
  13. DSP::MDCT<12> MP3LoaderPlugin::s_mdct_12;
  14. DSP::MDCT<36> MP3LoaderPlugin::s_mdct_36;
  15. MP3LoaderPlugin::MP3LoaderPlugin(NonnullOwnPtr<SeekableStream> stream)
  16. : LoaderPlugin(move(stream))
  17. {
  18. }
  19. Result<NonnullOwnPtr<MP3LoaderPlugin>, LoaderError> MP3LoaderPlugin::create(StringView path)
  20. {
  21. auto stream = LOADER_TRY(Core::BufferedFile::create(LOADER_TRY(Core::File::open(path, Core::File::OpenMode::Read))));
  22. auto loader = make<MP3LoaderPlugin>(move(stream));
  23. LOADER_TRY(loader->initialize());
  24. return loader;
  25. }
  26. Result<NonnullOwnPtr<MP3LoaderPlugin>, LoaderError> MP3LoaderPlugin::create(Bytes buffer)
  27. {
  28. auto stream = LOADER_TRY(try_make<FixedMemoryStream>(buffer));
  29. auto loader = make<MP3LoaderPlugin>(move(stream));
  30. LOADER_TRY(loader->initialize());
  31. return loader;
  32. }
  33. MaybeLoaderError MP3LoaderPlugin::initialize()
  34. {
  35. m_bitstream = LOADER_TRY(try_make<BigEndianInputBitStream>(MaybeOwned<Stream>(*m_stream)));
  36. TRY(synchronize());
  37. auto header = TRY(read_header());
  38. if (header.id != 1 || header.layer != 3)
  39. return LoaderError { LoaderError::Category::Format, "Only MPEG-1 layer 3 supported." };
  40. m_sample_rate = header.samplerate;
  41. m_num_channels = header.channel_count();
  42. m_loaded_samples = 0;
  43. TRY(build_seek_table());
  44. LOADER_TRY(m_stream->seek(0, SeekMode::SetPosition));
  45. return {};
  46. }
  47. MaybeLoaderError MP3LoaderPlugin::reset()
  48. {
  49. TRY(seek(0));
  50. m_current_frame = {};
  51. m_synthesis_buffer = {};
  52. m_loaded_samples = 0;
  53. LOADER_TRY(m_bit_reservoir.discard(m_bit_reservoir.used_buffer_size()));
  54. m_bitstream->align_to_byte_boundary();
  55. return {};
  56. }
  57. MaybeLoaderError MP3LoaderPlugin::seek(int const position)
  58. {
  59. for (auto const& seek_entry : m_seek_table) {
  60. if (seek_entry.get<1>() >= position) {
  61. LOADER_TRY(m_stream->seek(seek_entry.get<0>(), SeekMode::SetPosition));
  62. m_loaded_samples = seek_entry.get<1>();
  63. break;
  64. }
  65. }
  66. m_current_frame = {};
  67. m_synthesis_buffer = {};
  68. LOADER_TRY(m_bit_reservoir.discard(m_bit_reservoir.used_buffer_size()));
  69. m_bitstream->align_to_byte_boundary();
  70. return {};
  71. }
  72. ErrorOr<Vector<FixedArray<Sample>>, LoaderError> MP3LoaderPlugin::load_chunks(size_t samples_to_read_from_input)
  73. {
  74. int samples_to_read = samples_to_read_from_input;
  75. Vector<FixedArray<Sample>> frames;
  76. while (samples_to_read > 0) {
  77. FixedArray<Sample> samples = LOADER_TRY(FixedArray<Sample>::create(MP3::frame_size));
  78. if (!m_current_frame.has_value()) {
  79. auto maybe_frame = read_next_frame();
  80. if (maybe_frame.is_error()) {
  81. if (m_stream->is_eof()) {
  82. return Vector<FixedArray<Sample>> {};
  83. }
  84. return maybe_frame.release_error();
  85. }
  86. m_current_frame = maybe_frame.release_value();
  87. if (!m_current_frame.has_value())
  88. break;
  89. }
  90. bool const is_stereo = m_current_frame->header.channel_count() == 2;
  91. size_t current_frame_read = 0;
  92. for (; current_frame_read < MP3::granule_size; current_frame_read++) {
  93. auto const left_sample = m_current_frame->channels[0].granules[0].pcm[current_frame_read / 32][current_frame_read % 32];
  94. auto const right_sample = is_stereo ? m_current_frame->channels[1].granules[0].pcm[current_frame_read / 32][current_frame_read % 32] : left_sample;
  95. samples[current_frame_read] = Sample { left_sample, right_sample };
  96. samples_to_read--;
  97. }
  98. for (; current_frame_read < MP3::frame_size; current_frame_read++) {
  99. auto const left_sample = m_current_frame->channels[0].granules[1].pcm[(current_frame_read - MP3::granule_size) / 32][(current_frame_read - MP3::granule_size) % 32];
  100. auto const right_sample = is_stereo ? m_current_frame->channels[1].granules[1].pcm[(current_frame_read - MP3::granule_size) / 32][(current_frame_read - MP3::granule_size) % 32] : left_sample;
  101. samples[current_frame_read] = Sample { left_sample, right_sample };
  102. samples_to_read--;
  103. }
  104. m_loaded_samples += samples.size();
  105. TRY(frames.try_append(move(samples)));
  106. m_current_frame = {};
  107. }
  108. return frames;
  109. }
  110. MaybeLoaderError MP3LoaderPlugin::build_seek_table()
  111. {
  112. int sample_count = 0;
  113. size_t frame_count = 0;
  114. m_seek_table.clear();
  115. m_bitstream->align_to_byte_boundary();
  116. while (!synchronize().is_error()) {
  117. auto const frame_pos = -2 + LOADER_TRY(m_stream->seek(0, SeekMode::FromCurrentPosition));
  118. auto error_or_header = read_header();
  119. if (error_or_header.is_error() || error_or_header.value().id != 1 || error_or_header.value().layer != 3) {
  120. continue;
  121. }
  122. frame_count++;
  123. sample_count += MP3::frame_size;
  124. if (frame_count % 10 == 0)
  125. m_seek_table.append({ frame_pos, sample_count });
  126. LOADER_TRY(m_stream->seek(error_or_header.value().frame_size - 6, SeekMode::FromCurrentPosition));
  127. // TODO: This is just here to clear the bitstream buffer.
  128. // Bitstream should have a method to sync its state to the underlying stream.
  129. m_bitstream->align_to_byte_boundary();
  130. }
  131. m_total_samples = sample_count;
  132. return {};
  133. }
  134. ErrorOr<MP3::Header, LoaderError> MP3LoaderPlugin::read_header()
  135. {
  136. MP3::Header header;
  137. header.id = LOADER_TRY(m_bitstream->read_bit());
  138. header.layer = MP3::Tables::LayerNumberLookup[LOADER_TRY(m_bitstream->read_bits(2))];
  139. if (header.layer <= 0)
  140. return LoaderError { LoaderError::Category::Format, m_loaded_samples, "Frame header contains invalid layer number." };
  141. header.protection_bit = LOADER_TRY(m_bitstream->read_bit());
  142. header.bitrate = MP3::Tables::BitratesPerLayerLookup[header.layer - 1][LOADER_TRY(m_bitstream->read_bits(4))];
  143. if (header.bitrate <= 0)
  144. return LoaderError { LoaderError::Category::Format, m_loaded_samples, "Frame header contains invalid bitrate." };
  145. header.samplerate = MP3::Tables::SampleratesLookup[LOADER_TRY(m_bitstream->read_bits(2))];
  146. if (header.samplerate <= 0)
  147. return LoaderError { LoaderError::Category::Format, m_loaded_samples, "Frame header contains invalid samplerate." };
  148. header.padding_bit = LOADER_TRY(m_bitstream->read_bit());
  149. header.private_bit = LOADER_TRY(m_bitstream->read_bit());
  150. header.mode = static_cast<MP3::Mode>(LOADER_TRY(m_bitstream->read_bits(2)));
  151. header.mode_extension = static_cast<MP3::ModeExtension>(LOADER_TRY(m_bitstream->read_bits(2)));
  152. header.copyright_bit = LOADER_TRY(m_bitstream->read_bit());
  153. header.original_bit = LOADER_TRY(m_bitstream->read_bit());
  154. header.emphasis = static_cast<MP3::Emphasis>(LOADER_TRY(m_bitstream->read_bits(2)));
  155. if (!header.protection_bit)
  156. header.crc16 = LOADER_TRY(m_bitstream->read_bits<u16>(16));
  157. header.frame_size = 144 * header.bitrate * 1000 / header.samplerate + header.padding_bit;
  158. header.slot_count = header.frame_size - ((header.channel_count() == 2 ? 32 : 17) + (header.protection_bit ? 0 : 2) + 4);
  159. return header;
  160. }
  161. MaybeLoaderError MP3LoaderPlugin::synchronize()
  162. {
  163. size_t one_counter = 0;
  164. while (one_counter < 12 && !m_bitstream->is_eof()) {
  165. bool const bit = LOADER_TRY(m_bitstream->read_bit());
  166. one_counter = bit ? one_counter + 1 : 0;
  167. if (!bit) {
  168. m_bitstream->align_to_byte_boundary();
  169. }
  170. }
  171. if (one_counter != 12)
  172. return LoaderError { LoaderError::Category::Format, m_loaded_samples, "Failed to synchronize." };
  173. return {};
  174. }
  175. ErrorOr<MP3::MP3Frame, LoaderError> MP3LoaderPlugin::read_next_frame()
  176. {
  177. // Note: This will spin until we find a correct frame, or we reach eof.
  178. // In the second case, the error will bubble up from read_frame_data().
  179. while (true) {
  180. TRY(synchronize());
  181. MP3::Header header = TRY(read_header());
  182. if (header.id != 1 || header.layer != 3) {
  183. continue;
  184. }
  185. return read_frame_data(header);
  186. }
  187. }
  188. ErrorOr<MP3::MP3Frame, LoaderError> MP3LoaderPlugin::read_frame_data(MP3::Header const& header)
  189. {
  190. MP3::MP3Frame frame { header };
  191. TRY(read_side_information(frame));
  192. auto maybe_buffer = ByteBuffer::create_uninitialized(header.slot_count);
  193. if (maybe_buffer.is_error())
  194. return LoaderError { LoaderError::Category::IO, m_loaded_samples, "Out of memory" };
  195. auto& buffer = maybe_buffer.value();
  196. size_t old_reservoir_size = m_bit_reservoir.used_buffer_size();
  197. LOADER_TRY(m_bitstream->read_entire_buffer(buffer));
  198. // FIXME: This should write the entire span.
  199. if (LOADER_TRY(m_bit_reservoir.write_some(buffer)) != header.slot_count)
  200. return LoaderError { LoaderError::Category::IO, m_loaded_samples, "Could not write frame into bit reservoir." };
  201. // If we don't have enough data in the reservoir to process this frame, skip it (but keep the data).
  202. if (old_reservoir_size < static_cast<size_t>(frame.main_data_begin))
  203. return frame;
  204. TRY(m_bit_reservoir.discard(old_reservoir_size - frame.main_data_begin));
  205. BigEndianInputBitStream reservoir_stream { MaybeOwned<Stream>(m_bit_reservoir) };
  206. for (size_t granule_index = 0; granule_index < 2; granule_index++) {
  207. for (size_t channel_index = 0; channel_index < header.channel_count(); channel_index++) {
  208. size_t scale_factor_size = TRY(read_scale_factors(frame, reservoir_stream, granule_index, channel_index));
  209. TRY(read_huffman_data(frame, reservoir_stream, granule_index, channel_index, scale_factor_size));
  210. if (frame.channels[channel_index].granules[granule_index].block_type == MP3::BlockType::Short) {
  211. reorder_samples(frame.channels[channel_index].granules[granule_index], frame.header.samplerate);
  212. // Only reduce alias for lowest 2 bands as they're long.
  213. // Afaik this is not mentioned in the ISO spec, but it is addressed in the
  214. // changelog for the ISO compliance tests.
  215. if (frame.channels[channel_index].granules[granule_index].mixed_block_flag)
  216. reduce_alias(frame.channels[channel_index].granules[granule_index], 36);
  217. } else {
  218. reduce_alias(frame.channels[channel_index].granules[granule_index]);
  219. }
  220. }
  221. if (header.mode == MP3::Mode::JointStereo) {
  222. process_stereo(frame, granule_index);
  223. }
  224. }
  225. for (size_t granule_index = 0; granule_index < 2; granule_index++) {
  226. for (size_t channel_index = 0; channel_index < header.channel_count(); channel_index++) {
  227. auto& granule = frame.channels[channel_index].granules[granule_index];
  228. for (size_t i = 0; i < MP3::granule_size; i += 18) {
  229. MP3::BlockType block_type = granule.block_type;
  230. if (i < 36 && granule.mixed_block_flag) {
  231. // ISO/IEC 11172-3: if mixed_block_flag is set, the lowest two subbands are transformed with normal window.
  232. block_type = MP3::BlockType::Normal;
  233. }
  234. Array<float, 36> output;
  235. transform_samples_to_time(granule.samples, i, output, block_type);
  236. int const subband_index = i / 18;
  237. for (size_t sample_index = 0; sample_index < 18; sample_index++) {
  238. // overlap add
  239. granule.filter_bank_input[subband_index][sample_index] = output[sample_index] + m_last_values[channel_index][subband_index][sample_index];
  240. m_last_values[channel_index][subband_index][sample_index] = output[sample_index + 18];
  241. // frequency inversion
  242. if (subband_index % 2 == 1 && sample_index % 2 == 1)
  243. granule.filter_bank_input[subband_index][sample_index] *= -1;
  244. }
  245. }
  246. }
  247. }
  248. Array<float, 32> in_samples;
  249. for (size_t channel_index = 0; channel_index < frame.header.channel_count(); channel_index++) {
  250. for (size_t granule_index = 0; granule_index < 2; granule_index++) {
  251. auto& granule = frame.channels[channel_index].granules[granule_index];
  252. for (size_t sample_index = 0; sample_index < 18; sample_index++) {
  253. for (size_t band_index = 0; band_index < 32; band_index++) {
  254. in_samples[band_index] = granule.filter_bank_input[band_index][sample_index];
  255. }
  256. synthesis(m_synthesis_buffer[channel_index], in_samples, granule.pcm[sample_index]);
  257. }
  258. }
  259. }
  260. return frame;
  261. }
  262. MaybeLoaderError MP3LoaderPlugin::read_side_information(MP3::MP3Frame& frame)
  263. {
  264. frame.main_data_begin = LOADER_TRY(m_bitstream->read_bits(9));
  265. if (frame.header.channel_count() == 1) {
  266. frame.private_bits = LOADER_TRY(m_bitstream->read_bits(5));
  267. } else {
  268. frame.private_bits = LOADER_TRY(m_bitstream->read_bits(3));
  269. }
  270. for (size_t channel_index = 0; channel_index < frame.header.channel_count(); channel_index++) {
  271. for (size_t scale_factor_selection_info_band = 0; scale_factor_selection_info_band < 4; scale_factor_selection_info_band++) {
  272. frame.channels[channel_index].scale_factor_selection_info[scale_factor_selection_info_band] = LOADER_TRY(m_bitstream->read_bit());
  273. }
  274. }
  275. for (size_t granule_index = 0; granule_index < 2; granule_index++) {
  276. for (size_t channel_index = 0; channel_index < frame.header.channel_count(); channel_index++) {
  277. auto& granule = frame.channels[channel_index].granules[granule_index];
  278. granule.part_2_3_length = LOADER_TRY(m_bitstream->read_bits(12));
  279. granule.big_values = LOADER_TRY(m_bitstream->read_bits(9));
  280. granule.global_gain = LOADER_TRY(m_bitstream->read_bits(8));
  281. granule.scalefac_compress = LOADER_TRY(m_bitstream->read_bits(4));
  282. granule.window_switching_flag = LOADER_TRY(m_bitstream->read_bit());
  283. if (granule.window_switching_flag) {
  284. granule.block_type = static_cast<MP3::BlockType>(LOADER_TRY(m_bitstream->read_bits(2)));
  285. granule.mixed_block_flag = LOADER_TRY(m_bitstream->read_bit());
  286. for (size_t region = 0; region < 2; region++)
  287. granule.table_select[region] = LOADER_TRY(m_bitstream->read_bits(5));
  288. for (size_t window = 0; window < 3; window++)
  289. granule.sub_block_gain[window] = LOADER_TRY(m_bitstream->read_bits(3));
  290. granule.region0_count = (granule.block_type == MP3::BlockType::Short && !granule.mixed_block_flag) ? 8 : 7;
  291. granule.region1_count = 36;
  292. } else {
  293. for (size_t region = 0; region < 3; region++)
  294. granule.table_select[region] = LOADER_TRY(m_bitstream->read_bits(5));
  295. granule.region0_count = LOADER_TRY(m_bitstream->read_bits(4));
  296. granule.region1_count = LOADER_TRY(m_bitstream->read_bits(3));
  297. }
  298. granule.preflag = LOADER_TRY(m_bitstream->read_bit());
  299. granule.scalefac_scale = LOADER_TRY(m_bitstream->read_bit());
  300. granule.count1table_select = LOADER_TRY(m_bitstream->read_bit());
  301. }
  302. }
  303. return {};
  304. }
  305. // From ISO/IEC 11172-3 (2.4.3.4.7.1)
  306. Array<float, MP3::granule_size> MP3LoaderPlugin::calculate_frame_exponents(MP3::MP3Frame const& frame, size_t granule_index, size_t channel_index)
  307. {
  308. Array<float, MP3::granule_size> exponents;
  309. auto fill_band = [&exponents](float exponent, size_t start, size_t end) {
  310. for (size_t j = start; j <= end; j++) {
  311. exponents[j] = exponent;
  312. }
  313. };
  314. auto const& channel = frame.channels[channel_index];
  315. auto const& granule = frame.channels[channel_index].granules[granule_index];
  316. auto const scale_factor_bands = get_scalefactor_bands(granule, frame.header.samplerate);
  317. float const scale_factor_multiplier = granule.scalefac_scale ? 1 : 0.5;
  318. int const gain = granule.global_gain - 210;
  319. if (granule.block_type != MP3::BlockType::Short) {
  320. for (size_t band_index = 0; band_index < 22; band_index++) {
  321. float const exponent = gain / 4.0f - (scale_factor_multiplier * (channel.scale_factors[band_index] + granule.preflag * MP3::Tables::Pretab[band_index]));
  322. fill_band(AK::pow<float>(2.0, exponent), scale_factor_bands[band_index].start, scale_factor_bands[band_index].end);
  323. }
  324. } else {
  325. size_t band_index = 0;
  326. size_t sample_count = 0;
  327. if (granule.mixed_block_flag) {
  328. while (sample_count < 36) {
  329. float const exponent = gain / 4.0f - (scale_factor_multiplier * (channel.scale_factors[band_index] + granule.preflag * MP3::Tables::Pretab[band_index]));
  330. fill_band(AK::pow<float>(2.0, exponent), scale_factor_bands[band_index].start, scale_factor_bands[band_index].end);
  331. sample_count += scale_factor_bands[band_index].width;
  332. band_index++;
  333. }
  334. }
  335. float const gain0 = (gain - 8 * granule.sub_block_gain[0]) / 4.0;
  336. float const gain1 = (gain - 8 * granule.sub_block_gain[1]) / 4.0;
  337. float const gain2 = (gain - 8 * granule.sub_block_gain[2]) / 4.0;
  338. while (sample_count < MP3::granule_size && band_index < scale_factor_bands.size()) {
  339. float const exponent0 = gain0 - (scale_factor_multiplier * channel.scale_factors[band_index + 0]);
  340. float const exponent1 = gain1 - (scale_factor_multiplier * channel.scale_factors[band_index + 1]);
  341. float const exponent2 = gain2 - (scale_factor_multiplier * channel.scale_factors[band_index + 2]);
  342. fill_band(AK::pow<float>(2.0, exponent0), scale_factor_bands[band_index + 0].start, scale_factor_bands[band_index + 0].end);
  343. sample_count += scale_factor_bands[band_index + 0].width;
  344. fill_band(AK::pow<float>(2.0, exponent1), scale_factor_bands[band_index + 1].start, scale_factor_bands[band_index + 1].end);
  345. sample_count += scale_factor_bands[band_index + 1].width;
  346. fill_band(AK::pow<float>(2.0, exponent2), scale_factor_bands[band_index + 2].start, scale_factor_bands[band_index + 2].end);
  347. sample_count += scale_factor_bands[band_index + 2].width;
  348. band_index += 3;
  349. }
  350. while (sample_count < MP3::granule_size)
  351. exponents[sample_count++] = 0;
  352. }
  353. return exponents;
  354. }
  355. ErrorOr<size_t, LoaderError> MP3LoaderPlugin::read_scale_factors(MP3::MP3Frame& frame, BigEndianInputBitStream& reservoir, size_t granule_index, size_t channel_index)
  356. {
  357. auto& channel = frame.channels[channel_index];
  358. auto const& granule = channel.granules[granule_index];
  359. size_t band_index = 0;
  360. size_t bits_read = 0;
  361. if (granule.window_switching_flag && granule.block_type == MP3::BlockType::Short) {
  362. if (granule.mixed_block_flag) {
  363. for (size_t i = 0; i < 8; i++) {
  364. auto const bits = MP3::Tables::ScalefacCompressSlen1[granule.scalefac_compress];
  365. channel.scale_factors[band_index++] = TRY(reservoir.read_bits(bits));
  366. bits_read += bits;
  367. }
  368. for (size_t i = 3; i < 12; i++) {
  369. auto const bits = i <= 5 ? MP3::Tables::ScalefacCompressSlen1[granule.scalefac_compress] : MP3::Tables::ScalefacCompressSlen2[granule.scalefac_compress];
  370. channel.scale_factors[band_index++] = TRY(reservoir.read_bits(bits));
  371. channel.scale_factors[band_index++] = TRY(reservoir.read_bits(bits));
  372. channel.scale_factors[band_index++] = TRY(reservoir.read_bits(bits));
  373. bits_read += 3 * bits;
  374. }
  375. } else {
  376. for (size_t i = 0; i < 12; i++) {
  377. auto const bits = i <= 5 ? MP3::Tables::ScalefacCompressSlen1[granule.scalefac_compress] : MP3::Tables::ScalefacCompressSlen2[granule.scalefac_compress];
  378. channel.scale_factors[band_index++] = TRY(reservoir.read_bits(bits));
  379. channel.scale_factors[band_index++] = TRY(reservoir.read_bits(bits));
  380. channel.scale_factors[band_index++] = TRY(reservoir.read_bits(bits));
  381. bits_read += 3 * bits;
  382. }
  383. }
  384. channel.scale_factors[band_index++] = 0;
  385. channel.scale_factors[band_index++] = 0;
  386. channel.scale_factors[band_index++] = 0;
  387. } else {
  388. if ((channel.scale_factor_selection_info[0] == 0) || (granule_index == 0)) {
  389. for (band_index = 0; band_index < 6; band_index++) {
  390. auto const bits = MP3::Tables::ScalefacCompressSlen1[granule.scalefac_compress];
  391. channel.scale_factors[band_index] = TRY(reservoir.read_bits(bits));
  392. bits_read += bits;
  393. }
  394. }
  395. if ((channel.scale_factor_selection_info[1] == 0) || (granule_index == 0)) {
  396. for (band_index = 6; band_index < 11; band_index++) {
  397. auto const bits = MP3::Tables::ScalefacCompressSlen1[granule.scalefac_compress];
  398. channel.scale_factors[band_index] = TRY(reservoir.read_bits(bits));
  399. bits_read += bits;
  400. }
  401. }
  402. if ((channel.scale_factor_selection_info[2] == 0) || (granule_index == 0)) {
  403. for (band_index = 11; band_index < 16; band_index++) {
  404. auto const bits = MP3::Tables::ScalefacCompressSlen2[granule.scalefac_compress];
  405. channel.scale_factors[band_index] = TRY(reservoir.read_bits(bits));
  406. bits_read += bits;
  407. }
  408. }
  409. if ((channel.scale_factor_selection_info[3] == 0) || (granule_index == 0)) {
  410. for (band_index = 16; band_index < 21; band_index++) {
  411. auto const bits = MP3::Tables::ScalefacCompressSlen2[granule.scalefac_compress];
  412. channel.scale_factors[band_index] = TRY(reservoir.read_bits(bits));
  413. bits_read += bits;
  414. }
  415. }
  416. channel.scale_factors[21] = 0;
  417. }
  418. return bits_read;
  419. }
  420. MaybeLoaderError MP3LoaderPlugin::read_huffman_data(MP3::MP3Frame& frame, BigEndianInputBitStream& reservoir, size_t granule_index, size_t channel_index, size_t granule_bits_read)
  421. {
  422. auto const exponents = calculate_frame_exponents(frame, granule_index, channel_index);
  423. auto& granule = frame.channels[channel_index].granules[granule_index];
  424. auto const scale_factor_bands = get_scalefactor_bands(granule, frame.header.samplerate);
  425. size_t const scale_factor_band_index1 = granule.region0_count + 1;
  426. size_t const scale_factor_band_index2 = min(scale_factor_bands.size() - 1, scale_factor_band_index1 + granule.region1_count + 1);
  427. bool const is_short_granule = granule.window_switching_flag && granule.block_type == MP3::BlockType::Short;
  428. size_t const region1_start = is_short_granule ? 36 : scale_factor_bands[scale_factor_band_index1].start;
  429. size_t const region2_start = is_short_granule ? MP3::granule_size : scale_factor_bands[scale_factor_band_index2].start;
  430. auto requantize = [](int const sample, float const exponent) -> float {
  431. int const sign = sample < 0 ? -1 : 1;
  432. int const magnitude = AK::abs(sample);
  433. return sign * AK::pow<float>(static_cast<float>(magnitude), 4 / 3.0) * exponent;
  434. };
  435. size_t count = 0;
  436. for (; count < granule.big_values * 2; count += 2) {
  437. MP3::Tables::Huffman::HuffmanTreeXY const* tree = nullptr;
  438. if (count < region1_start) {
  439. tree = &MP3::Tables::Huffman::HuffmanTreesXY[granule.table_select[0]];
  440. } else if (count < region2_start) {
  441. tree = &MP3::Tables::Huffman::HuffmanTreesXY[granule.table_select[1]];
  442. } else {
  443. tree = &MP3::Tables::Huffman::HuffmanTreesXY[granule.table_select[2]];
  444. }
  445. if (!tree || tree->nodes.is_empty()) {
  446. return LoaderError { LoaderError::Category::Format, m_loaded_samples, "Frame references invalid huffman table." };
  447. }
  448. // Assumption: There's enough bits to read. 32 is just a placeholder for "unlimited".
  449. // There are no 32 bit long huffman codes in the tables.
  450. auto const entry = MP3::Tables::Huffman::huffman_decode(reservoir, tree->nodes, 32);
  451. granule_bits_read += entry.bits_read;
  452. if (!entry.code.has_value())
  453. return LoaderError { LoaderError::Category::Format, m_loaded_samples, "Frame contains invalid huffman data." };
  454. int x = entry.code->symbol.x;
  455. int y = entry.code->symbol.y;
  456. if (x == 15 && tree->linbits > 0) {
  457. x += LOADER_TRY(reservoir.read_bits(tree->linbits));
  458. granule_bits_read += tree->linbits;
  459. }
  460. if (x != 0) {
  461. if (LOADER_TRY(reservoir.read_bit()))
  462. x = -x;
  463. granule_bits_read++;
  464. }
  465. if (y == 15 && tree->linbits > 0) {
  466. y += LOADER_TRY(reservoir.read_bits(tree->linbits));
  467. granule_bits_read += tree->linbits;
  468. }
  469. if (y != 0) {
  470. if (LOADER_TRY(reservoir.read_bit()))
  471. y = -y;
  472. granule_bits_read++;
  473. }
  474. granule.samples[count + 0] = requantize(x, exponents[count + 0]);
  475. granule.samples[count + 1] = requantize(y, exponents[count + 1]);
  476. }
  477. ReadonlySpan<MP3::Tables::Huffman::HuffmanNode<MP3::Tables::Huffman::HuffmanVWXY>> count1table = granule.count1table_select ? MP3::Tables::Huffman::TreeB : MP3::Tables::Huffman::TreeA;
  478. // count1 is not known. We have to read huffman encoded values
  479. // until we've exhausted the granule's bits. We know the size of
  480. // the granule from part2_3_length, which is the number of bits
  481. // used for scaleactors and huffman data (in the granule).
  482. while (granule_bits_read < granule.part_2_3_length && count <= MP3::granule_size - 4) {
  483. auto const entry = MP3::Tables::Huffman::huffman_decode(reservoir, count1table, granule.part_2_3_length - granule_bits_read);
  484. granule_bits_read += entry.bits_read;
  485. if (!entry.code.has_value())
  486. return LoaderError { LoaderError::Category::Format, m_loaded_samples, "Frame contains invalid huffman data." };
  487. int v = entry.code->symbol.v;
  488. if (v != 0) {
  489. if (granule_bits_read >= granule.part_2_3_length)
  490. break;
  491. if (LOADER_TRY(reservoir.read_bit()))
  492. v = -v;
  493. granule_bits_read++;
  494. }
  495. int w = entry.code->symbol.w;
  496. if (w != 0) {
  497. if (granule_bits_read >= granule.part_2_3_length)
  498. break;
  499. if (LOADER_TRY(reservoir.read_bit()))
  500. w = -w;
  501. granule_bits_read++;
  502. }
  503. int x = entry.code->symbol.x;
  504. if (x != 0) {
  505. if (granule_bits_read >= granule.part_2_3_length)
  506. break;
  507. if (LOADER_TRY(reservoir.read_bit()))
  508. x = -x;
  509. granule_bits_read++;
  510. }
  511. int y = entry.code->symbol.y;
  512. if (y != 0) {
  513. if (granule_bits_read >= granule.part_2_3_length)
  514. break;
  515. if (LOADER_TRY(reservoir.read_bit()))
  516. y = -y;
  517. granule_bits_read++;
  518. }
  519. granule.samples[count + 0] = requantize(v, exponents[count + 0]);
  520. granule.samples[count + 1] = requantize(w, exponents[count + 1]);
  521. granule.samples[count + 2] = requantize(x, exponents[count + 2]);
  522. granule.samples[count + 3] = requantize(y, exponents[count + 3]);
  523. count += 4;
  524. }
  525. if (granule_bits_read > granule.part_2_3_length) {
  526. return LoaderError { LoaderError::Category::Format, m_loaded_samples, "Read too many bits from bit reservoir." };
  527. }
  528. for (size_t i = granule_bits_read; i < granule.part_2_3_length; i++) {
  529. LOADER_TRY(reservoir.read_bit());
  530. }
  531. return {};
  532. }
  533. void MP3LoaderPlugin::reorder_samples(MP3::Granule& granule, u32 sample_rate)
  534. {
  535. float tmp[MP3::granule_size] = {};
  536. size_t band_index = 0;
  537. size_t subband_index = 0;
  538. auto scale_factor_bands = get_scalefactor_bands(granule, sample_rate);
  539. if (granule.mixed_block_flag) {
  540. while (subband_index < 36) {
  541. for (size_t frequency_line_index = 0; frequency_line_index < scale_factor_bands[band_index].width; frequency_line_index++) {
  542. tmp[subband_index] = granule.samples[subband_index];
  543. subband_index++;
  544. }
  545. band_index++;
  546. }
  547. }
  548. while (subband_index < MP3::granule_size && band_index <= 36) {
  549. for (size_t frequency_line_index = 0; frequency_line_index < scale_factor_bands[band_index].width; frequency_line_index++) {
  550. tmp[subband_index++] = granule.samples[scale_factor_bands[band_index + 0].start + frequency_line_index];
  551. tmp[subband_index++] = granule.samples[scale_factor_bands[band_index + 1].start + frequency_line_index];
  552. tmp[subband_index++] = granule.samples[scale_factor_bands[band_index + 2].start + frequency_line_index];
  553. }
  554. band_index += 3;
  555. }
  556. for (size_t i = 0; i < MP3::granule_size; i++)
  557. granule.samples[i] = tmp[i];
  558. }
  559. void MP3LoaderPlugin::reduce_alias(MP3::Granule& granule, size_t max_subband_index)
  560. {
  561. for (size_t subband = 0; subband < max_subband_index - 18; subband += 18) {
  562. for (size_t i = 0; i < 8; i++) {
  563. size_t const idx1 = subband + 17 - i;
  564. size_t const idx2 = subband + 18 + i;
  565. auto const d1 = granule.samples[idx1];
  566. auto const d2 = granule.samples[idx2];
  567. granule.samples[idx1] = d1 * MP3::Tables::AliasReductionCs[i] - d2 * MP3::Tables::AliasReductionCa[i];
  568. granule.samples[idx2] = d2 * MP3::Tables::AliasReductionCs[i] + d1 * MP3::Tables::AliasReductionCa[i];
  569. }
  570. }
  571. }
  572. void MP3LoaderPlugin::process_stereo(MP3::MP3Frame& frame, size_t granule_index)
  573. {
  574. size_t band_index_ms_start = 0;
  575. size_t band_index_ms_end = 0;
  576. size_t band_index_intensity_start = 0;
  577. size_t band_index_intensity_end = 0;
  578. auto& granule_left = frame.channels[0].granules[granule_index];
  579. auto& granule_right = frame.channels[1].granules[granule_index];
  580. auto get_last_nonempty_band = [](Span<float> samples, ReadonlySpan<MP3::Tables::ScaleFactorBand> bands) -> size_t {
  581. size_t last_nonempty_band = 0;
  582. for (size_t i = 0; i < bands.size(); i++) {
  583. bool is_empty = true;
  584. for (size_t l = bands[i].start; l < bands[i].end; l++) {
  585. if (samples[l] != 0) {
  586. is_empty = false;
  587. break;
  588. }
  589. }
  590. if (!is_empty)
  591. last_nonempty_band = i;
  592. }
  593. return last_nonempty_band;
  594. };
  595. auto process_ms_stereo = [&](MP3::Tables::ScaleFactorBand const& band) {
  596. float const SQRT_2 = AK::sqrt(2.0);
  597. for (size_t i = band.start; i <= band.end; i++) {
  598. float const m = granule_left.samples[i];
  599. float const s = granule_right.samples[i];
  600. granule_left.samples[i] = (m + s) / SQRT_2;
  601. granule_right.samples[i] = (m - s) / SQRT_2;
  602. }
  603. };
  604. auto process_intensity_stereo = [&](MP3::Tables::ScaleFactorBand const& band, float intensity_stereo_ratio) {
  605. for (size_t i = band.start; i <= band.end; i++) {
  606. float const sample_left = granule_left.samples[i];
  607. float const coeff_l = intensity_stereo_ratio / (1 + intensity_stereo_ratio);
  608. float const coeff_r = 1 / (1 + intensity_stereo_ratio);
  609. granule_left.samples[i] = sample_left * coeff_l;
  610. granule_right.samples[i] = sample_left * coeff_r;
  611. }
  612. };
  613. auto scale_factor_bands = get_scalefactor_bands(granule_right, frame.header.samplerate);
  614. if (has_flag(frame.header.mode_extension, MP3::ModeExtension::MsStereo)) {
  615. band_index_ms_start = 0;
  616. band_index_ms_end = scale_factor_bands.size();
  617. }
  618. if (has_flag(frame.header.mode_extension, MP3::ModeExtension::IntensityStereo)) {
  619. band_index_intensity_start = get_last_nonempty_band(granule_right.samples, scale_factor_bands);
  620. band_index_intensity_end = scale_factor_bands.size();
  621. band_index_ms_end = band_index_intensity_start;
  622. }
  623. for (size_t band_index = band_index_ms_start; band_index < band_index_ms_end; band_index++) {
  624. process_ms_stereo(scale_factor_bands[band_index]);
  625. }
  626. for (size_t band_index = band_index_intensity_start; band_index < band_index_intensity_end; band_index++) {
  627. auto const intensity_stereo_position = frame.channels[1].scale_factors[band_index];
  628. if (intensity_stereo_position == 7) {
  629. if (has_flag(frame.header.mode_extension, MP3::ModeExtension::MsStereo))
  630. process_ms_stereo(scale_factor_bands[band_index]);
  631. continue;
  632. }
  633. float const intensity_stereo_ratio = AK::tan(intensity_stereo_position * AK::Pi<float> / 12);
  634. process_intensity_stereo(scale_factor_bands[band_index], intensity_stereo_ratio);
  635. }
  636. }
  637. void MP3LoaderPlugin::transform_samples_to_time(Array<float, MP3::granule_size> const& input, size_t input_offset, Array<float, 36>& output, MP3::BlockType block_type)
  638. {
  639. if (block_type == MP3::BlockType::Short) {
  640. size_t const N = 12;
  641. Array<float, N * 3> temp_out;
  642. Array<float, N / 2> temp_in;
  643. for (size_t k = 0; k < N / 2; k++)
  644. temp_in[k] = input[input_offset + 3 * k + 0];
  645. s_mdct_12.transform(temp_in, Span<float>(temp_out).slice(0, N));
  646. for (size_t i = 0; i < N; i++)
  647. temp_out[i + 0] *= MP3::Tables::WindowBlockTypeShort[i];
  648. for (size_t k = 0; k < N / 2; k++)
  649. temp_in[k] = input[input_offset + 3 * k + 1];
  650. s_mdct_12.transform(temp_in, Span<float>(temp_out).slice(12, N));
  651. for (size_t i = 0; i < N; i++)
  652. temp_out[i + 12] *= MP3::Tables::WindowBlockTypeShort[i];
  653. for (size_t k = 0; k < N / 2; k++)
  654. temp_in[k] = input[input_offset + 3 * k + 2];
  655. s_mdct_12.transform(temp_in, Span<float>(temp_out).slice(24, N));
  656. for (size_t i = 0; i < N; i++)
  657. temp_out[i + 24] *= MP3::Tables::WindowBlockTypeShort[i];
  658. Span<float> idmct1 = Span<float>(temp_out).slice(0, 12);
  659. Span<float> idmct2 = Span<float>(temp_out).slice(12, 12);
  660. Span<float> idmct3 = Span<float>(temp_out).slice(24, 12);
  661. for (size_t i = 0; i < 6; i++)
  662. output[i] = 0;
  663. for (size_t i = 6; i < 12; i++)
  664. output[i] = idmct1[i - 6];
  665. for (size_t i = 12; i < 18; i++)
  666. output[i] = idmct1[i - 6] + idmct2[i - 12];
  667. for (size_t i = 18; i < 24; i++)
  668. output[i] = idmct2[i - 12] + idmct3[i - 18];
  669. for (size_t i = 24; i < 30; i++)
  670. output[i] = idmct3[i - 18];
  671. for (size_t i = 30; i < 36; i++)
  672. output[i] = 0;
  673. } else {
  674. s_mdct_36.transform(ReadonlySpan<float>(input).slice(input_offset, 18), output);
  675. for (size_t i = 0; i < 36; i++) {
  676. switch (block_type) {
  677. case MP3::BlockType::Normal:
  678. output[i] *= MP3::Tables::WindowBlockTypeNormal[i];
  679. break;
  680. case MP3::BlockType::Start:
  681. output[i] *= MP3::Tables::WindowBlockTypeStart[i];
  682. break;
  683. case MP3::BlockType::End:
  684. output[i] *= MP3::Tables::WindowBlockTypeEnd[i];
  685. break;
  686. case MP3::BlockType::Short:
  687. VERIFY_NOT_REACHED();
  688. break;
  689. }
  690. }
  691. }
  692. }
  693. // ISO/IEC 11172-3 (Figure A.2)
  694. void MP3LoaderPlugin::synthesis(Array<float, 1024>& V, Array<float, 32>& samples, Array<float, 32>& result)
  695. {
  696. for (size_t i = 1023; i >= 64; i--) {
  697. V[i] = V[i - 64];
  698. }
  699. for (size_t i = 0; i < 64; i++) {
  700. V[i] = 0;
  701. for (size_t k = 0; k < 32; k++) {
  702. float const N = MP3::Tables::SynthesisSubbandFilterCoefficients[i][k];
  703. V[i] += N * samples[k];
  704. }
  705. }
  706. Array<float, 512> U;
  707. for (size_t i = 0; i < 8; i++) {
  708. for (size_t j = 0; j < 32; j++) {
  709. U[i * 64 + j] = V[i * 128 + j];
  710. U[i * 64 + 32 + j] = V[i * 128 + 96 + j];
  711. }
  712. }
  713. Array<float, 512> W;
  714. for (size_t i = 0; i < 512; i++) {
  715. W[i] = U[i] * MP3::Tables::WindowSynthesis[i];
  716. }
  717. for (size_t j = 0; j < 32; j++) {
  718. result[j] = 0;
  719. for (size_t k = 0; k < 16; k++) {
  720. result[j] += W[j + 32 * k];
  721. }
  722. }
  723. }
  724. ReadonlySpan<MP3::Tables::ScaleFactorBand> MP3LoaderPlugin::get_scalefactor_bands(MP3::Granule const& granule, int samplerate)
  725. {
  726. switch (granule.block_type) {
  727. case MP3::BlockType::Short:
  728. switch (samplerate) {
  729. case 32000:
  730. return granule.mixed_block_flag ? MP3::Tables::ScaleFactorBandMixed32000 : MP3::Tables::ScaleFactorBandShort32000;
  731. case 44100:
  732. return granule.mixed_block_flag ? MP3::Tables::ScaleFactorBandMixed44100 : MP3::Tables::ScaleFactorBandShort44100;
  733. case 48000:
  734. return granule.mixed_block_flag ? MP3::Tables::ScaleFactorBandMixed48000 : MP3::Tables::ScaleFactorBandShort48000;
  735. }
  736. break;
  737. case MP3::BlockType::Normal:
  738. [[fallthrough]];
  739. case MP3::BlockType::Start:
  740. [[fallthrough]];
  741. case MP3::BlockType::End:
  742. switch (samplerate) {
  743. case 32000:
  744. return MP3::Tables::ScaleFactorBandLong32000;
  745. case 44100:
  746. return MP3::Tables::ScaleFactorBandLong44100;
  747. case 48000:
  748. return MP3::Tables::ScaleFactorBandLong48000;
  749. }
  750. }
  751. VERIFY_NOT_REACHED();
  752. }
  753. }