// Copyright (c) 2012 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "base/basictypes.h" #include "base/logging.h" #include "base/memory/scoped_ptr.h" #include "media/mp4/box_definitions.h" #include "media/mp4/rcheck.h" #include "media/mp4/track_run_iterator.h" #include "testing/gtest/include/gtest/gtest.h" // The sum of the elements in a vector initialized with SumAscending, // less the value of the last element. static const int kSumAscending1 = 45; static const int kAudioScale = 48000; static const int kVideoScale = 25; static const uint32 kSampleIsDifferenceSampleFlagMask = 0x10000; static const uint8 kAuxInfo[] = { 0x41, 0x54, 0x65, 0x73, 0x74, 0x49, 0x76, 0x31, 0x41, 0x54, 0x65, 0x73, 0x74, 0x49, 0x76, 0x32, 0x00, 0x02, 0x00, 0x01, 0x00, 0x00, 0x00, 0x02, 0x00, 0x03, 0x00, 0x00, 0x00, 0x04 }; static const char kIv1[] = { 0x41, 0x54, 0x65, 0x73, 0x74, 0x49, 0x76, 0x31, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 }; static const uint8 kKeyId[] = { 0x41, 0x47, 0x6f, 0x6f, 0x67, 0x6c, 0x65, 0x54, 0x65, 0x73, 0x74, 0x4b, 0x65, 0x79, 0x49, 0x44 }; namespace media { namespace mp4 { class TrackRunIteratorTest : public testing::Test { public: TrackRunIteratorTest() { CreateMovie(); } protected: Movie moov_; LogCB log_cb_; scoped_ptr iter_; void CreateMovie() { moov_.header.timescale = 1000; moov_.tracks.resize(3); moov_.extends.tracks.resize(2); moov_.tracks[0].header.track_id = 1; moov_.tracks[0].media.header.timescale = kAudioScale; SampleDescription& desc1 = moov_.tracks[0].media.information.sample_table.description; AudioSampleEntry aud_desc; aud_desc.format = FOURCC_MP4A; aud_desc.sinf.info.track_encryption.is_encrypted = false; desc1.type = kAudio; desc1.audio_entries.push_back(aud_desc); moov_.extends.tracks[0].track_id = 1; moov_.extends.tracks[0].default_sample_description_index = 1; moov_.tracks[1].header.track_id = 2; moov_.tracks[1].media.header.timescale = kVideoScale; SampleDescription& desc2 = moov_.tracks[1].media.information.sample_table.description; VideoSampleEntry vid_desc; vid_desc.format = FOURCC_AVC1; vid_desc.sinf.info.track_encryption.is_encrypted = false; desc2.type = kVideo; desc2.video_entries.push_back(vid_desc); moov_.extends.tracks[1].track_id = 2; moov_.extends.tracks[1].default_sample_description_index = 1; moov_.tracks[2].header.track_id = 3; moov_.tracks[2].media.information.sample_table.description.type = kHint; } MovieFragment CreateFragment() { MovieFragment moof; moof.tracks.resize(2); moof.tracks[0].decode_time.decode_time = 0; moof.tracks[0].header.track_id = 1; moof.tracks[0].header.has_default_sample_flags = true; moof.tracks[0].header.default_sample_duration = 1024; moof.tracks[0].header.default_sample_size = 4; moof.tracks[0].runs.resize(2); moof.tracks[0].runs[0].sample_count = 10; moof.tracks[0].runs[0].data_offset = 100; SetAscending(&moof.tracks[0].runs[0].sample_sizes); moof.tracks[0].runs[1].sample_count = 10; moof.tracks[0].runs[1].data_offset = 10000; moof.tracks[1].header.track_id = 2; moof.tracks[1].header.has_default_sample_flags = false; moof.tracks[1].decode_time.decode_time = 10; moof.tracks[1].runs.resize(1); moof.tracks[1].runs[0].sample_count = 10; moof.tracks[1].runs[0].data_offset = 200; SetAscending(&moof.tracks[1].runs[0].sample_sizes); SetAscending(&moof.tracks[1].runs[0].sample_durations); moof.tracks[1].runs[0].sample_flags.resize(10); for (size_t i = 1; i < moof.tracks[1].runs[0].sample_flags.size(); i++) { moof.tracks[1].runs[0].sample_flags[i] = kSampleIsDifferenceSampleFlagMask; } return moof; } // Update the first sample description of a Track to indicate encryption void AddEncryption(Track* track) { SampleDescription* stsd = &track->media.information.sample_table.description; ProtectionSchemeInfo* sinf; if (!stsd->video_entries.empty()) { sinf = &stsd->video_entries[0].sinf; } else { sinf = &stsd->audio_entries[0].sinf; } sinf->type.type = FOURCC_CENC; sinf->info.track_encryption.is_encrypted = true; sinf->info.track_encryption.default_iv_size = 8; sinf->info.track_encryption.default_kid.insert( sinf->info.track_encryption.default_kid.begin(), kKeyId, kKeyId + arraysize(kKeyId)); } // Add aux info covering the first track run to a TrackFragment, and update // the run to ensure it matches length and subsample information. void AddAuxInfoHeaders(int offset, TrackFragment* frag) { frag->auxiliary_offset.offsets.push_back(offset); frag->auxiliary_size.sample_count = 2; frag->auxiliary_size.sample_info_sizes.push_back(8); frag->auxiliary_size.sample_info_sizes.push_back(22); frag->runs[0].sample_count = 2; frag->runs[0].sample_sizes[1] = 10; } void SetAscending(std::vector* vec) { vec->resize(10); for (size_t i = 0; i < vec->size(); i++) (*vec)[i] = i+1; } }; TEST_F(TrackRunIteratorTest, NoRunsTest) { iter_.reset(new TrackRunIterator(&moov_, log_cb_)); ASSERT_TRUE(iter_->Init(MovieFragment())); EXPECT_FALSE(iter_->IsRunValid()); EXPECT_FALSE(iter_->IsSampleValid()); } TEST_F(TrackRunIteratorTest, BasicOperationTest) { iter_.reset(new TrackRunIterator(&moov_, log_cb_)); MovieFragment moof = CreateFragment(); // Test that runs are sorted correctly, and that properties of the initial // sample of the first run are correct ASSERT_TRUE(iter_->Init(moof)); EXPECT_TRUE(iter_->IsRunValid()); EXPECT_FALSE(iter_->is_encrypted()); EXPECT_EQ(iter_->track_id(), 1u); EXPECT_EQ(iter_->sample_offset(), 100); EXPECT_EQ(iter_->sample_size(), 1); EXPECT_EQ(iter_->dts(), TimeDeltaFromRational(0, kAudioScale)); EXPECT_EQ(iter_->cts(), TimeDeltaFromRational(0, kAudioScale)); EXPECT_EQ(iter_->duration(), TimeDeltaFromRational(1024, kAudioScale)); EXPECT_TRUE(iter_->is_keyframe()); // Advance to the last sample in the current run, and test its properties for (int i = 0; i < 9; i++) iter_->AdvanceSample(); EXPECT_EQ(iter_->track_id(), 1u); EXPECT_EQ(iter_->sample_offset(), 100 + kSumAscending1); EXPECT_EQ(iter_->sample_size(), 10); EXPECT_EQ(iter_->dts(), TimeDeltaFromRational(1024 * 9, kAudioScale)); EXPECT_EQ(iter_->duration(), TimeDeltaFromRational(1024, kAudioScale)); EXPECT_TRUE(iter_->is_keyframe()); // Test end-of-run iter_->AdvanceSample(); EXPECT_FALSE(iter_->IsSampleValid()); // Test last sample of next run iter_->AdvanceRun(); EXPECT_TRUE(iter_->is_keyframe()); for (int i = 0; i < 9; i++) iter_->AdvanceSample(); EXPECT_EQ(iter_->track_id(), 2u); EXPECT_EQ(iter_->sample_offset(), 200 + kSumAscending1); EXPECT_EQ(iter_->sample_size(), 10); int64 base_dts = kSumAscending1 + moof.tracks[1].decode_time.decode_time; EXPECT_EQ(iter_->dts(), TimeDeltaFromRational(base_dts, kVideoScale)); EXPECT_EQ(iter_->duration(), TimeDeltaFromRational(10, kVideoScale)); EXPECT_FALSE(iter_->is_keyframe()); // Test final run iter_->AdvanceRun(); EXPECT_EQ(iter_->track_id(), 1u); EXPECT_EQ(iter_->dts(), TimeDeltaFromRational(1024 * 10, kAudioScale)); iter_->AdvanceSample(); EXPECT_EQ(moof.tracks[0].runs[1].data_offset + moof.tracks[0].header.default_sample_size, iter_->sample_offset()); iter_->AdvanceRun(); EXPECT_FALSE(iter_->IsRunValid()); } TEST_F(TrackRunIteratorTest, TrackExtendsDefaultsTest) { moov_.extends.tracks[0].default_sample_duration = 50; moov_.extends.tracks[0].default_sample_size = 3; moov_.extends.tracks[0].default_sample_flags = kSampleIsDifferenceSampleFlagMask; iter_.reset(new TrackRunIterator(&moov_, log_cb_)); MovieFragment moof = CreateFragment(); moof.tracks[0].header.has_default_sample_flags = false; moof.tracks[0].header.default_sample_size = 0; moof.tracks[0].header.default_sample_duration = 0; moof.tracks[0].runs[0].sample_sizes.clear(); ASSERT_TRUE(iter_->Init(moof)); iter_->AdvanceSample(); EXPECT_FALSE(iter_->is_keyframe()); EXPECT_EQ(iter_->sample_size(), 3); EXPECT_EQ(iter_->sample_offset(), moof.tracks[0].runs[0].data_offset + 3); EXPECT_EQ(iter_->duration(), TimeDeltaFromRational(50, kAudioScale)); EXPECT_EQ(iter_->dts(), TimeDeltaFromRational(50, kAudioScale)); } TEST_F(TrackRunIteratorTest, FirstSampleFlagTest) { // Ensure that keyframes are flagged correctly in the face of BMFF boxes which // explicitly specify the flags for the first sample in a run and rely on // defaults for all subsequent samples iter_.reset(new TrackRunIterator(&moov_, log_cb_)); MovieFragment moof = CreateFragment(); moof.tracks[1].header.has_default_sample_flags = true; moof.tracks[1].header.default_sample_flags = kSampleIsDifferenceSampleFlagMask; moof.tracks[1].runs[0].sample_flags.resize(1); ASSERT_TRUE(iter_->Init(moof)); iter_->AdvanceRun(); EXPECT_TRUE(iter_->is_keyframe()); iter_->AdvanceSample(); EXPECT_FALSE(iter_->is_keyframe()); } TEST_F(TrackRunIteratorTest, MinDecodeTest) { iter_.reset(new TrackRunIterator(&moov_, log_cb_)); MovieFragment moof = CreateFragment(); moof.tracks[0].decode_time.decode_time = kAudioScale; ASSERT_TRUE(iter_->Init(moof)); EXPECT_EQ(TimeDeltaFromRational(moof.tracks[1].decode_time.decode_time, kVideoScale), iter_->GetMinDecodeTimestamp()); } TEST_F(TrackRunIteratorTest, ReorderingTest) { // Test frame reordering and edit list support. The frames have the following // decode timestamps: // // 0ms 40ms 120ms 240ms // | 0 | 1 - | 2 - - | // // ...and these composition timestamps, after edit list adjustment: // // 0ms 40ms 160ms 240ms // | 0 | 2 - - | 1 - | // Create an edit list with one entry, with an initial start time of 80ms // (that is, 2 / kVideoTimescale) and a duration of zero (which is treated as // infinite according to 14496-12:2012). This will cause the first 80ms of the // media timeline - which will be empty, due to CTS biasing - to be discarded. iter_.reset(new TrackRunIterator(&moov_, log_cb_)); EditListEntry entry; entry.segment_duration = 0; entry.media_time = 2; entry.media_rate_integer = 1; entry.media_rate_fraction = 0; moov_.tracks[1].edit.list.edits.push_back(entry); // Add CTS offsets. Without bias, the CTS offsets for the first three frames // would simply be [0, 3, -2]. Since CTS offsets should be non-negative for // maximum compatibility, these values are biased up to [2, 5, 0], and the // extra 80ms is removed via the edit list. MovieFragment moof = CreateFragment(); std::vector& cts_offsets = moof.tracks[1].runs[0].sample_composition_time_offsets; cts_offsets.resize(10); cts_offsets[0] = 2; cts_offsets[1] = 5; cts_offsets[2] = 0; moof.tracks[1].decode_time.decode_time = 0; ASSERT_TRUE(iter_->Init(moof)); iter_->AdvanceRun(); EXPECT_EQ(iter_->dts(), TimeDeltaFromRational(0, kVideoScale)); EXPECT_EQ(iter_->cts(), TimeDeltaFromRational(0, kVideoScale)); EXPECT_EQ(iter_->duration(), TimeDeltaFromRational(1, kVideoScale)); iter_->AdvanceSample(); EXPECT_EQ(iter_->dts(), TimeDeltaFromRational(1, kVideoScale)); EXPECT_EQ(iter_->cts(), TimeDeltaFromRational(4, kVideoScale)); EXPECT_EQ(iter_->duration(), TimeDeltaFromRational(2, kVideoScale)); iter_->AdvanceSample(); EXPECT_EQ(iter_->dts(), TimeDeltaFromRational(3, kVideoScale)); EXPECT_EQ(iter_->cts(), TimeDeltaFromRational(1, kVideoScale)); EXPECT_EQ(iter_->duration(), TimeDeltaFromRational(3, kVideoScale)); } TEST_F(TrackRunIteratorTest, IgnoreUnknownAuxInfoTest) { iter_.reset(new TrackRunIterator(&moov_, log_cb_)); MovieFragment moof = CreateFragment(); moof.tracks[1].auxiliary_offset.offsets.push_back(50); moof.tracks[1].auxiliary_size.default_sample_info_size = 2; moof.tracks[1].auxiliary_size.sample_count = 2; moof.tracks[1].runs[0].sample_count = 2; ASSERT_TRUE(iter_->Init(moof)); iter_->AdvanceRun(); EXPECT_FALSE(iter_->AuxInfoNeedsToBeCached()); } TEST_F(TrackRunIteratorTest, DecryptConfigTest) { AddEncryption(&moov_.tracks[1]); iter_.reset(new TrackRunIterator(&moov_, log_cb_)); MovieFragment moof = CreateFragment(); AddAuxInfoHeaders(50, &moof.tracks[1]); ASSERT_TRUE(iter_->Init(moof)); // The run for track 2 will be first, since its aux info offset is the first // element in the file. EXPECT_EQ(iter_->track_id(), 2u); EXPECT_TRUE(iter_->is_encrypted()); EXPECT_TRUE(iter_->AuxInfoNeedsToBeCached()); EXPECT_EQ(static_cast(iter_->aux_info_size()), arraysize(kAuxInfo)); EXPECT_EQ(iter_->aux_info_offset(), 50); EXPECT_EQ(iter_->GetMaxClearOffset(), 50); EXPECT_FALSE(iter_->CacheAuxInfo(NULL, 0)); EXPECT_FALSE(iter_->CacheAuxInfo(kAuxInfo, 3)); EXPECT_TRUE(iter_->AuxInfoNeedsToBeCached()); EXPECT_TRUE(iter_->CacheAuxInfo(kAuxInfo, arraysize(kAuxInfo))); EXPECT_FALSE(iter_->AuxInfoNeedsToBeCached()); EXPECT_EQ(iter_->sample_offset(), 200); EXPECT_EQ(iter_->GetMaxClearOffset(), moof.tracks[0].runs[0].data_offset); scoped_ptr config = iter_->GetDecryptConfig(); ASSERT_EQ(arraysize(kKeyId), config->key_id().size()); EXPECT_TRUE(!memcmp(kKeyId, config->key_id().data(), config->key_id().size())); ASSERT_EQ(arraysize(kIv1), config->iv().size()); EXPECT_TRUE(!memcmp(kIv1, config->iv().data(), config->iv().size())); EXPECT_TRUE(config->subsamples().empty()); iter_->AdvanceSample(); config = iter_->GetDecryptConfig(); EXPECT_EQ(config->subsamples().size(), 2u); EXPECT_EQ(config->subsamples()[0].clear_bytes, 1u); EXPECT_EQ(config->subsamples()[1].cypher_bytes, 4u); } // It is legal for aux info blocks to be shared among multiple formats. TEST_F(TrackRunIteratorTest, SharedAuxInfoTest) { AddEncryption(&moov_.tracks[0]); AddEncryption(&moov_.tracks[1]); iter_.reset(new TrackRunIterator(&moov_, log_cb_)); MovieFragment moof = CreateFragment(); moof.tracks[0].runs.resize(1); AddAuxInfoHeaders(50, &moof.tracks[0]); AddAuxInfoHeaders(50, &moof.tracks[1]); moof.tracks[0].auxiliary_size.default_sample_info_size = 8; ASSERT_TRUE(iter_->Init(moof)); EXPECT_EQ(iter_->track_id(), 1u); EXPECT_EQ(iter_->aux_info_offset(), 50); EXPECT_TRUE(iter_->CacheAuxInfo(kAuxInfo, arraysize(kAuxInfo))); scoped_ptr config = iter_->GetDecryptConfig(); ASSERT_EQ(arraysize(kIv1), config->iv().size()); EXPECT_TRUE(!memcmp(kIv1, config->iv().data(), config->iv().size())); iter_->AdvanceSample(); EXPECT_EQ(iter_->GetMaxClearOffset(), 50); iter_->AdvanceRun(); EXPECT_EQ(iter_->GetMaxClearOffset(), 50); EXPECT_EQ(iter_->aux_info_offset(), 50); EXPECT_TRUE(iter_->CacheAuxInfo(kAuxInfo, arraysize(kAuxInfo))); EXPECT_EQ(iter_->GetMaxClearOffset(), 200); ASSERT_EQ(arraysize(kIv1), config->iv().size()); EXPECT_TRUE(!memcmp(kIv1, config->iv().data(), config->iv().size())); iter_->AdvanceSample(); EXPECT_EQ(iter_->GetMaxClearOffset(), 201); } // Sensible files are expected to place auxiliary information for a run // immediately before the main data for that run. Alternative schemes are // possible, however, including the somewhat reasonable behavior of placing all // aux info at the head of the 'mdat' box together, and the completely // unreasonable behavior demonstrated here: // byte 50: track 2, run 1 aux info // byte 100: track 1, run 1 data // byte 200: track 2, run 1 data // byte 201: track 1, run 2 aux info (*inside* track 2, run 1 data) // byte 10000: track 1, run 2 data // byte 20000: track 1, run 1 aux info TEST_F(TrackRunIteratorTest, UnexpectedOrderingTest) { AddEncryption(&moov_.tracks[0]); AddEncryption(&moov_.tracks[1]); iter_.reset(new TrackRunIterator(&moov_, log_cb_)); MovieFragment moof = CreateFragment(); AddAuxInfoHeaders(20000, &moof.tracks[0]); moof.tracks[0].auxiliary_offset.offsets.push_back(201); moof.tracks[0].auxiliary_size.sample_count += 2; moof.tracks[0].auxiliary_size.default_sample_info_size = 8; moof.tracks[0].runs[1].sample_count = 2; AddAuxInfoHeaders(50, &moof.tracks[1]); moof.tracks[1].runs[0].sample_sizes[0] = 5; ASSERT_TRUE(iter_->Init(moof)); EXPECT_EQ(iter_->track_id(), 2u); EXPECT_EQ(iter_->aux_info_offset(), 50); EXPECT_EQ(iter_->sample_offset(), 200); EXPECT_TRUE(iter_->CacheAuxInfo(kAuxInfo, arraysize(kAuxInfo))); EXPECT_EQ(iter_->GetMaxClearOffset(), 100); iter_->AdvanceRun(); EXPECT_EQ(iter_->track_id(), 1u); EXPECT_EQ(iter_->aux_info_offset(), 20000); EXPECT_EQ(iter_->sample_offset(), 100); EXPECT_TRUE(iter_->CacheAuxInfo(kAuxInfo, arraysize(kAuxInfo))); EXPECT_EQ(iter_->GetMaxClearOffset(), 100); iter_->AdvanceSample(); EXPECT_EQ(iter_->GetMaxClearOffset(), 101); iter_->AdvanceRun(); EXPECT_EQ(iter_->track_id(), 1u); EXPECT_EQ(iter_->aux_info_offset(), 201); EXPECT_EQ(iter_->sample_offset(), 10000); EXPECT_EQ(iter_->GetMaxClearOffset(), 201); EXPECT_TRUE(iter_->CacheAuxInfo(kAuxInfo, arraysize(kAuxInfo))); EXPECT_EQ(iter_->GetMaxClearOffset(), 10000); } } // namespace mp4 } // namespace media