/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ /* vim:set ts=2 sw=2 sts=2 et cindent: */ /* This Source Code Form is subject to the terms of the Mozilla Public * License, v. 2.0. If a copy of the MPL was not distributed with this * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ #include "nsError.h" #include "MediaDecoderStateMachine.h" #include "AbstractMediaDecoder.h" #include "MediaResource.h" #include "WebMReader.h" #include "WebMBufferedParser.h" #include "mozilla/dom/TimeRanges.h" #include "VorbisUtils.h" #include "gfx2DGlue.h" #include #define VPX_DONT_DEFINE_STDINT_TYPES #include "vpx/vp8dx.h" #include "vpx/vpx_decoder.h" #include "OggReader.h" using mozilla::NesteggPacketHolder; template <> class nsAutoRefTraits : public nsPointerRefTraits { public: static void Release(NesteggPacketHolder* aHolder) { delete aHolder; } }; namespace mozilla { using namespace gfx; using namespace layers; // Un-comment to enable logging of seek bisections. //#define SEEK_LOGGING #ifdef PR_LOGGING extern PRLogModuleInfo* gMediaDecoderLog; PRLogModuleInfo* gNesteggLog; #define LOG(type, msg) PR_LOG(gMediaDecoderLog, type, msg) #ifdef SEEK_LOGGING #define SEEK_LOG(type, msg) PR_LOG(gMediaDecoderLog, type, msg) #else #define SEEK_LOG(type, msg) #endif #else #define LOG(type, msg) #define SEEK_LOG(type, msg) #endif static const unsigned NS_PER_USEC = 1000; static const double NS_PER_S = 1e9; // Functions for reading and seeking using MediaResource required for // nestegg_io. The 'user data' passed to these functions is the // decoder from which the media resource is obtained. static int webm_read(void *aBuffer, size_t aLength, void *aUserData) { NS_ASSERTION(aUserData, "aUserData must point to a valid AbstractMediaDecoder"); AbstractMediaDecoder* decoder = reinterpret_cast(aUserData); MediaResource* resource = decoder->GetResource(); NS_ASSERTION(resource, "Decoder has no media resource"); nsresult rv = NS_OK; bool eof = false; char *p = static_cast(aBuffer); while (NS_SUCCEEDED(rv) && aLength > 0) { uint32_t bytes = 0; rv = resource->Read(p, aLength, &bytes); if (bytes == 0) { eof = true; break; } aLength -= bytes; p += bytes; } return NS_FAILED(rv) ? -1 : eof ? 0 : 1; } static int webm_seek(int64_t aOffset, int aWhence, void *aUserData) { NS_ASSERTION(aUserData, "aUserData must point to a valid AbstractMediaDecoder"); AbstractMediaDecoder* decoder = reinterpret_cast(aUserData); MediaResource* resource = decoder->GetResource(); NS_ASSERTION(resource, "Decoder has no media resource"); nsresult rv = resource->Seek(aWhence, aOffset); return NS_SUCCEEDED(rv) ? 0 : -1; } static int64_t webm_tell(void *aUserData) { NS_ASSERTION(aUserData, "aUserData must point to a valid AbstractMediaDecoder"); AbstractMediaDecoder* decoder = reinterpret_cast(aUserData); MediaResource* resource = decoder->GetResource(); NS_ASSERTION(resource, "Decoder has no media resource"); return resource->Tell(); } static void webm_log(nestegg * context, unsigned int severity, char const * format, ...) { #ifdef PR_LOGGING va_list args; char msg[256]; const char * sevStr; switch(severity) { case NESTEGG_LOG_DEBUG: sevStr = "DBG"; break; case NESTEGG_LOG_INFO: sevStr = "INF"; break; case NESTEGG_LOG_WARNING: sevStr = "WRN"; break; case NESTEGG_LOG_ERROR: sevStr = "ERR"; break; case NESTEGG_LOG_CRITICAL: sevStr = "CRT"; break; default: sevStr = "UNK"; break; } va_start(args, format); PR_snprintf(msg, sizeof(msg), "%p [Nestegg-%s] ", context, sevStr); PR_vsnprintf(msg+strlen(msg), sizeof(msg)-strlen(msg), format, args); PR_LOG(gNesteggLog, PR_LOG_DEBUG, (msg)); va_end(args); #endif } WebMReader::WebMReader(AbstractMediaDecoder* aDecoder) : MediaDecoderReader(aDecoder), mContext(nullptr), mPacketCount(0), mChannels(0), #ifdef MOZ_OPUS mOpusParser(nullptr), mOpusDecoder(nullptr), mSkip(0), mSeekPreroll(0), #endif mVideoTrack(0), mAudioTrack(0), mAudioStartUsec(-1), mAudioFrames(0), mHasVideo(false), mHasAudio(false) { MOZ_COUNT_CTOR(WebMReader); #ifdef PR_LOGGING if (!gNesteggLog) { gNesteggLog = PR_NewLogModule("Nestegg"); } #endif // Zero these member vars to avoid crashes in VP8 destroy and Vorbis clear // functions when destructor is called before |Init|. memset(&mVPX, 0, sizeof(vpx_codec_ctx_t)); memset(&mVorbisBlock, 0, sizeof(vorbis_block)); memset(&mVorbisDsp, 0, sizeof(vorbis_dsp_state)); memset(&mVorbisInfo, 0, sizeof(vorbis_info)); memset(&mVorbisComment, 0, sizeof(vorbis_comment)); } WebMReader::~WebMReader() { Cleanup(); mVideoPackets.Reset(); mAudioPackets.Reset(); vpx_codec_destroy(&mVPX); vorbis_block_clear(&mVorbisBlock); vorbis_dsp_clear(&mVorbisDsp); vorbis_info_clear(&mVorbisInfo); vorbis_comment_clear(&mVorbisComment); if (mOpusDecoder) { opus_multistream_decoder_destroy(mOpusDecoder); mOpusDecoder = nullptr; } MOZ_COUNT_DTOR(WebMReader); } nsresult WebMReader::Init(MediaDecoderReader* aCloneDonor) { vorbis_info_init(&mVorbisInfo); vorbis_comment_init(&mVorbisComment); memset(&mVorbisDsp, 0, sizeof(vorbis_dsp_state)); memset(&mVorbisBlock, 0, sizeof(vorbis_block)); if (aCloneDonor) { mBufferedState = static_cast(aCloneDonor)->mBufferedState; } else { mBufferedState = new WebMBufferedState; } return NS_OK; } nsresult WebMReader::ResetDecode() { mAudioFrames = 0; mAudioStartUsec = -1; nsresult res = NS_OK; if (NS_FAILED(MediaDecoderReader::ResetDecode())) { res = NS_ERROR_FAILURE; } if (mAudioCodec == NESTEGG_CODEC_VORBIS) { // Ignore failed results from vorbis_synthesis_restart. They // aren't fatal and it fails when ResetDecode is called at a // time when no vorbis data has been read. vorbis_synthesis_restart(&mVorbisDsp); #ifdef MOZ_OPUS } else if (mAudioCodec == NESTEGG_CODEC_OPUS) { if (mOpusDecoder) { // Reset the decoder. opus_multistream_decoder_ctl(mOpusDecoder, OPUS_RESET_STATE); mSkip = mOpusParser->mPreSkip; } #endif } mVideoPackets.Reset(); mAudioPackets.Reset(); return res; } void WebMReader::Cleanup() { if (mContext) { nestegg_destroy(mContext); mContext = nullptr; } } nsresult WebMReader::ReadMetadata(MediaInfo* aInfo, MetadataTags** aTags) { NS_ASSERTION(mDecoder->OnDecodeThread(), "Should be on decode thread."); nestegg_io io; io.read = webm_read; io.seek = webm_seek; io.tell = webm_tell; io.userdata = mDecoder; int64_t maxOffset = -1; int r = nestegg_init(&mContext, io, &webm_log, maxOffset); if (r == -1) { return NS_ERROR_FAILURE; } uint64_t duration = 0; r = nestegg_duration(mContext, &duration); if (r == 0) { ReentrantMonitorAutoEnter mon(mDecoder->GetReentrantMonitor()); mDecoder->SetMediaDuration(duration / NS_PER_USEC); } unsigned int ntracks = 0; r = nestegg_track_count(mContext, &ntracks); if (r == -1) { Cleanup(); return NS_ERROR_FAILURE; } for (uint32_t track = 0; track < ntracks; ++track) { int id = nestegg_track_codec_id(mContext, track); if (id == -1) { Cleanup(); return NS_ERROR_FAILURE; } int type = nestegg_track_type(mContext, track); if (!mHasVideo && type == NESTEGG_TRACK_VIDEO) { nestegg_video_params params; r = nestegg_track_video_params(mContext, track, ¶ms); if (r == -1) { Cleanup(); return NS_ERROR_FAILURE; } vpx_codec_iface_t* dx = nullptr; mVideoCodec = nestegg_track_codec_id(mContext, track); if (mVideoCodec == NESTEGG_CODEC_VP8) { dx = vpx_codec_vp8_dx(); } else if (mVideoCodec == NESTEGG_CODEC_VP9) { dx = vpx_codec_vp9_dx(); } if (!dx || vpx_codec_dec_init(&mVPX, dx, nullptr, 0)) { Cleanup(); return NS_ERROR_FAILURE; } // Picture region, taking into account cropping, before scaling // to the display size. nsIntRect pictureRect(params.crop_left, params.crop_top, params.width - (params.crop_right + params.crop_left), params.height - (params.crop_bottom + params.crop_top)); // If the cropping data appears invalid then use the frame data if (pictureRect.width <= 0 || pictureRect.height <= 0 || pictureRect.x < 0 || pictureRect.y < 0) { pictureRect.x = 0; pictureRect.y = 0; pictureRect.width = params.width; pictureRect.height = params.height; } // Validate the container-reported frame and pictureRect sizes. This ensures // that our video frame creation code doesn't overflow. nsIntSize displaySize(params.display_width, params.display_height); nsIntSize frameSize(params.width, params.height); if (!IsValidVideoRegion(frameSize, pictureRect, displaySize)) { // Video track's frame sizes will overflow. Ignore the video track. continue; } mVideoTrack = track; mHasVideo = true; mInfo.mVideo.mHasVideo = true; mInfo.mVideo.mDisplay = displaySize; mPicture = pictureRect; mInitialFrame = frameSize; switch (params.stereo_mode) { case NESTEGG_VIDEO_MONO: mInfo.mVideo.mStereoMode = StereoMode::MONO; break; case NESTEGG_VIDEO_STEREO_LEFT_RIGHT: mInfo.mVideo.mStereoMode = StereoMode::LEFT_RIGHT; break; case NESTEGG_VIDEO_STEREO_BOTTOM_TOP: mInfo.mVideo.mStereoMode = StereoMode::BOTTOM_TOP; break; case NESTEGG_VIDEO_STEREO_TOP_BOTTOM: mInfo.mVideo.mStereoMode = StereoMode::TOP_BOTTOM; break; case NESTEGG_VIDEO_STEREO_RIGHT_LEFT: mInfo.mVideo.mStereoMode = StereoMode::RIGHT_LEFT; break; } } else if (!mHasAudio && type == NESTEGG_TRACK_AUDIO) { nestegg_audio_params params; r = nestegg_track_audio_params(mContext, track, ¶ms); if (r == -1) { Cleanup(); return NS_ERROR_FAILURE; } mAudioTrack = track; mHasAudio = true; mInfo.mAudio.mHasAudio = true; mAudioCodec = nestegg_track_codec_id(mContext, track); mCodecDelay = params.codec_delay / NS_PER_USEC; if (mAudioCodec == NESTEGG_CODEC_VORBIS) { // Get the Vorbis header data unsigned int nheaders = 0; r = nestegg_track_codec_data_count(mContext, track, &nheaders); if (r == -1 || nheaders != 3) { Cleanup(); return NS_ERROR_FAILURE; } for (uint32_t header = 0; header < nheaders; ++header) { unsigned char* data = 0; size_t length = 0; r = nestegg_track_codec_data(mContext, track, header, &data, &length); if (r == -1) { Cleanup(); return NS_ERROR_FAILURE; } ogg_packet opacket = InitOggPacket(data, length, header == 0, false, 0); r = vorbis_synthesis_headerin(&mVorbisInfo, &mVorbisComment, &opacket); if (r != 0) { Cleanup(); return NS_ERROR_FAILURE; } } r = vorbis_synthesis_init(&mVorbisDsp, &mVorbisInfo); if (r != 0) { Cleanup(); return NS_ERROR_FAILURE; } r = vorbis_block_init(&mVorbisDsp, &mVorbisBlock); if (r != 0) { Cleanup(); return NS_ERROR_FAILURE; } mInfo.mAudio.mRate = mVorbisDsp.vi->rate; mInfo.mAudio.mChannels = mVorbisDsp.vi->channels; mChannels = mInfo.mAudio.mChannels; #ifdef MOZ_OPUS } else if (mAudioCodec == NESTEGG_CODEC_OPUS) { unsigned char* data = 0; size_t length = 0; r = nestegg_track_codec_data(mContext, track, 0, &data, &length); if (r == -1) { Cleanup(); return NS_ERROR_FAILURE; } mOpusParser = new OpusParser; if (!mOpusParser->DecodeHeader(data, length)) { Cleanup(); return NS_ERROR_FAILURE; } if (!InitOpusDecoder()) { Cleanup(); return NS_ERROR_FAILURE; } if (static_cast(mCodecDelay) != FramesToUsecs(mOpusParser->mPreSkip, mOpusParser->mRate).value()) { LOG(PR_LOG_WARNING, ("Invalid Opus header: CodecDelay and pre-skip do not match!\n")); Cleanup(); return NS_ERROR_FAILURE; } mInfo.mAudio.mRate = mOpusParser->mRate; mInfo.mAudio.mChannels = mOpusParser->mChannels; mChannels = mInfo.mAudio.mChannels; mSeekPreroll = params.seek_preroll; #endif } else { Cleanup(); return NS_ERROR_FAILURE; } } } // We can't seek in buffered regions if we have no cues. mDecoder->SetMediaSeekable(nestegg_has_cues(mContext) == 1); *aInfo = mInfo; *aTags = nullptr; return NS_OK; } #ifdef MOZ_OPUS bool WebMReader::InitOpusDecoder() { int r; NS_ASSERTION(mOpusDecoder == nullptr, "leaking OpusDecoder"); mOpusDecoder = opus_multistream_decoder_create(mOpusParser->mRate, mOpusParser->mChannels, mOpusParser->mStreams, mOpusParser->mCoupledStreams, mOpusParser->mMappingTable, &r); mSkip = mOpusParser->mPreSkip; return r == OPUS_OK; } #endif ogg_packet WebMReader::InitOggPacket(unsigned char* aData, size_t aLength, bool aBOS, bool aEOS, int64_t aGranulepos) { ogg_packet packet; packet.packet = aData; packet.bytes = aLength; packet.b_o_s = aBOS; packet.e_o_s = aEOS; packet.granulepos = aGranulepos; packet.packetno = mPacketCount++; return packet; } bool WebMReader::DecodeAudioPacket(nestegg_packet* aPacket, int64_t aOffset) { NS_ASSERTION(mDecoder->OnDecodeThread(), "Should be on decode thread."); int r = 0; unsigned int count = 0; r = nestegg_packet_count(aPacket, &count); if (r == -1) { return false; } uint64_t tstamp = 0; r = nestegg_packet_tstamp(aPacket, &tstamp); if (r == -1) { return false; } const uint32_t rate = mInfo.mAudio.mRate; uint64_t tstamp_usecs = tstamp / NS_PER_USEC; if (mAudioStartUsec == -1) { // This is the first audio chunk. Assume the start time of our decode // is the start of this chunk. mAudioStartUsec = tstamp_usecs; } // If there's a gap between the start of this audio chunk and the end of // the previous audio chunk, we need to increment the packet count so that // the vorbis decode doesn't use data from before the gap to help decode // from after the gap. CheckedInt64 tstamp_frames = UsecsToFrames(tstamp_usecs, rate); CheckedInt64 decoded_frames = UsecsToFrames(mAudioStartUsec, rate); if (!tstamp_frames.isValid() || !decoded_frames.isValid()) { NS_WARNING("Int overflow converting WebM times to frames"); return false; } decoded_frames += mAudioFrames; if (!decoded_frames.isValid()) { NS_WARNING("Int overflow adding decoded_frames"); return false; } if (tstamp_frames.value() > decoded_frames.value()) { #ifdef DEBUG CheckedInt64 usecs = FramesToUsecs(tstamp_frames.value() - decoded_frames.value(), rate); LOG(PR_LOG_DEBUG, ("WebMReader detected gap of %lld, %lld frames, in audio stream\n", usecs.isValid() ? usecs.value() : -1, tstamp_frames.value() - decoded_frames.value())); #endif mPacketCount++; mAudioStartUsec = tstamp_usecs; mAudioFrames = 0; } int32_t total_frames = 0; for (uint32_t i = 0; i < count; ++i) { unsigned char* data; size_t length; r = nestegg_packet_data(aPacket, i, &data, &length); if (r == -1) { return false; } if (mAudioCodec == NESTEGG_CODEC_VORBIS) { ogg_packet opacket = InitOggPacket(data, length, false, false, -1); if (vorbis_synthesis(&mVorbisBlock, &opacket) != 0) { return false; } if (vorbis_synthesis_blockin(&mVorbisDsp, &mVorbisBlock) != 0) { return false; } VorbisPCMValue** pcm = 0; int32_t frames = 0; while ((frames = vorbis_synthesis_pcmout(&mVorbisDsp, &pcm)) > 0) { nsAutoArrayPtr buffer(new AudioDataValue[frames * mChannels]); for (uint32_t j = 0; j < mChannels; ++j) { VorbisPCMValue* channel = pcm[j]; for (uint32_t i = 0; i < uint32_t(frames); ++i) { buffer[i*mChannels + j] = MOZ_CONVERT_VORBIS_SAMPLE(channel[i]); } } CheckedInt64 duration = FramesToUsecs(frames, rate); if (!duration.isValid()) { NS_WARNING("Int overflow converting WebM audio duration"); return false; } CheckedInt64 total_duration = FramesToUsecs(total_frames, rate); if (!total_duration.isValid()) { NS_WARNING("Int overflow converting WebM audio total_duration"); return false; } CheckedInt64 time = total_duration + tstamp_usecs; if (!time.isValid()) { NS_WARNING("Int overflow adding total_duration and tstamp_usecs"); nestegg_free_packet(aPacket); return false; }; total_frames += frames; AudioQueue().Push(new AudioData(aOffset, time.value(), duration.value(), frames, buffer.forget(), mChannels)); mAudioFrames += frames; if (vorbis_synthesis_read(&mVorbisDsp, frames) != 0) { return false; } } } else if (mAudioCodec == NESTEGG_CODEC_OPUS) { #ifdef MOZ_OPUS uint32_t channels = mOpusParser->mChannels; // Maximum value is 63*2880, so there's no chance of overflow. int32_t frames_number = opus_packet_get_nb_frames(data, length); if (frames_number <= 0) return false; // Invalid packet header. int32_t samples = opus_packet_get_samples_per_frame(data, (opus_int32) rate); int32_t frames = frames_number*samples; // A valid Opus packet must be between 2.5 and 120 ms long. if (frames < 120 || frames > 5760) return false; nsAutoArrayPtr buffer(new AudioDataValue[frames * channels]); // Decode to the appropriate sample type. #ifdef MOZ_SAMPLE_TYPE_FLOAT32 int ret = opus_multistream_decode_float(mOpusDecoder, data, length, buffer, frames, false); #else int ret = opus_multistream_decode(mOpusDecoder, data, length, buffer, frames, false); #endif if (ret < 0) return false; NS_ASSERTION(ret == frames, "Opus decoded too few audio samples"); CheckedInt64 startTime = tstamp_usecs; // Trim the initial frames while the decoder is settling. if (mSkip > 0) { int32_t skipFrames = std::min(mSkip, frames); if (skipFrames == frames) { // discard the whole packet mSkip -= frames; LOG(PR_LOG_DEBUG, ("Opus decoder skipping %d frames" " (whole packet)", frames)); return true; } int32_t keepFrames = frames - skipFrames; int samples = keepFrames * channels; nsAutoArrayPtr trimBuffer(new AudioDataValue[samples]); for (int i = 0; i < samples; i++) trimBuffer[i] = buffer[skipFrames*channels + i]; startTime = startTime + FramesToUsecs(skipFrames, rate); frames = keepFrames; buffer = trimBuffer; mSkip -= skipFrames; LOG(PR_LOG_DEBUG, ("Opus decoder skipping %d frames", skipFrames)); } int64_t discardPadding = 0; r = nestegg_packet_discard_padding(aPacket, &discardPadding); if (discardPadding > 0) { CheckedInt64 discardFrames = UsecsToFrames(discardPadding * NS_PER_USEC, rate); if (!discardFrames.isValid()) { NS_WARNING("Int overflow in DiscardPadding"); return false; } int32_t keepFrames = frames - discardFrames.value(); if (keepFrames > 0) { int samples = keepFrames * channels; nsAutoArrayPtr trimBuffer(new AudioDataValue[samples]); for (int i = 0; i < samples; i++) trimBuffer[i] = buffer[i]; frames = keepFrames; buffer = trimBuffer; } else { LOG(PR_LOG_DEBUG, ("Opus decoder discarding whole packet" " ( %d frames) as padding", frames)); return true; } } // Apply the header gain if one was specified. #ifdef MOZ_SAMPLE_TYPE_FLOAT32 if (mOpusParser->mGain != 1.0f) { float gain = mOpusParser->mGain; int samples = frames * channels; for (int i = 0; i < samples; i++) { buffer[i] *= gain; } } #else if (mOpusParser->mGain_Q16 != 65536) { int64_t gain_Q16 = mOpusParser->mGain_Q16; int samples = frames * channels; for (int i = 0; i < samples; i++) { int32_t val = static_cast((gain_Q16*buffer[i] + 32768)>>16); buffer[i] = static_cast(MOZ_CLIP_TO_15(val)); } } #endif // No channel mapping for more than 8 channels. if (channels > 8) { return false; } CheckedInt64 duration = FramesToUsecs(frames, rate); if (!duration.isValid()) { NS_WARNING("Int overflow converting WebM audio duration"); return false; } CheckedInt64 time = startTime - mCodecDelay; if (!time.isValid()) { NS_WARNING("Int overflow shifting tstamp by codec delay"); nestegg_free_packet(aPacket); return false; }; AudioQueue().Push(new AudioData(mDecoder->GetResource()->Tell(), time.value(), duration.value(), frames, buffer.forget(), mChannels)); mAudioFrames += frames; #else return false; #endif /* MOZ_OPUS */ } } return true; } nsReturnRef WebMReader::NextPacket(TrackType aTrackType) { // The packet queue that packets will be pushed on if they // are not the type we are interested in. WebMPacketQueue& otherPackets = aTrackType == VIDEO ? mAudioPackets : mVideoPackets; // The packet queue for the type that we are interested in. WebMPacketQueue &packets = aTrackType == VIDEO ? mVideoPackets : mAudioPackets; // Flag to indicate that we do need to playback these types of // packets. bool hasType = aTrackType == VIDEO ? mHasVideo : mHasAudio; // Flag to indicate that we do need to playback the other type // of track. bool hasOtherType = aTrackType == VIDEO ? mHasAudio : mHasVideo; // Track we are interested in uint32_t ourTrack = aTrackType == VIDEO ? mVideoTrack : mAudioTrack; // Value of other track uint32_t otherTrack = aTrackType == VIDEO ? mAudioTrack : mVideoTrack; nsAutoRef holder; if (packets.GetSize() > 0) { holder.own(packets.PopFront()); } else { // Keep reading packets until we find a packet // for the track we want. do { nestegg_packet* packet; int r = nestegg_read_packet(mContext, &packet); if (r <= 0) { return nsReturnRef(); } int64_t offset = mDecoder->GetResource()->Tell(); holder.own(new NesteggPacketHolder(packet, offset)); unsigned int track = 0; r = nestegg_packet_track(packet, &track); if (r == -1) { return nsReturnRef(); } if (hasOtherType && otherTrack == track) { // Save the packet for when we want these packets otherPackets.Push(holder.disown()); continue; } // The packet is for the track we want to play if (hasType && ourTrack == track) { break; } } while (true); } return holder.out(); } bool WebMReader::DecodeAudioData() { NS_ASSERTION(mDecoder->OnDecodeThread(), "Should be on decode thread."); nsAutoRef holder(NextPacket(AUDIO)); if (!holder) { return false; } return DecodeAudioPacket(holder->mPacket, holder->mOffset); } bool WebMReader::DecodeVideoFrame(bool &aKeyframeSkip, int64_t aTimeThreshold) { NS_ASSERTION(mDecoder->OnDecodeThread(), "Should be on decode thread."); // Record number of frames decoded and parsed. Automatically update the // stats counters using the AutoNotifyDecoded stack-based class. uint32_t parsed = 0, decoded = 0; AbstractMediaDecoder::AutoNotifyDecoded autoNotify(mDecoder, parsed, decoded); nsAutoRef holder(NextPacket(VIDEO)); if (!holder) { return false; } nestegg_packet* packet = holder->mPacket; unsigned int track = 0; int r = nestegg_packet_track(packet, &track); if (r == -1) { return false; } unsigned int count = 0; r = nestegg_packet_count(packet, &count); if (r == -1) { return false; } uint64_t tstamp = 0; r = nestegg_packet_tstamp(packet, &tstamp); if (r == -1) { return false; } // The end time of this frame is the start time of the next frame. Fetch // the timestamp of the next packet for this track. If we've reached the // end of the resource, use the file's duration as the end time of this // video frame. uint64_t next_tstamp = 0; { nsAutoRef next_holder(NextPacket(VIDEO)); if (next_holder) { r = nestegg_packet_tstamp(next_holder->mPacket, &next_tstamp); if (r == -1) { return false; } PushVideoPacket(next_holder.disown()); } else { ReentrantMonitorAutoEnter decoderMon(mDecoder->GetReentrantMonitor()); int64_t endTime = mDecoder->GetEndMediaTime(); if (endTime == -1) { return false; } next_tstamp = endTime * NS_PER_USEC; } } int64_t tstamp_usecs = tstamp / NS_PER_USEC; for (uint32_t i = 0; i < count; ++i) { unsigned char* data; size_t length; r = nestegg_packet_data(packet, i, &data, &length); if (r == -1) { return false; } vpx_codec_stream_info_t si; memset(&si, 0, sizeof(si)); si.sz = sizeof(si); if (mVideoCodec == NESTEGG_CODEC_VP8) { vpx_codec_peek_stream_info(vpx_codec_vp8_dx(), data, length, &si); } else if (mVideoCodec == NESTEGG_CODEC_VP9) { vpx_codec_peek_stream_info(vpx_codec_vp9_dx(), data, length, &si); } if (aKeyframeSkip && (!si.is_kf || tstamp_usecs < aTimeThreshold)) { // Skipping to next keyframe... parsed++; // Assume 1 frame per chunk. continue; } if (aKeyframeSkip && si.is_kf) { aKeyframeSkip = false; } if (vpx_codec_decode(&mVPX, data, length, nullptr, 0)) { return false; } // If the timestamp of the video frame is less than // the time threshold required then it is not added // to the video queue and won't be displayed. if (tstamp_usecs < aTimeThreshold) { parsed++; // Assume 1 frame per chunk. continue; } vpx_codec_iter_t iter = nullptr; vpx_image_t *img; while ((img = vpx_codec_get_frame(&mVPX, &iter))) { NS_ASSERTION(img->fmt == IMG_FMT_I420, "WebM image format is not I420"); // Chroma shifts are rounded down as per the decoding examples in the VP8 SDK VideoData::YCbCrBuffer b; b.mPlanes[0].mData = img->planes[0]; b.mPlanes[0].mStride = img->stride[0]; b.mPlanes[0].mHeight = img->d_h; b.mPlanes[0].mWidth = img->d_w; b.mPlanes[0].mOffset = b.mPlanes[0].mSkip = 0; b.mPlanes[1].mData = img->planes[1]; b.mPlanes[1].mStride = img->stride[1]; b.mPlanes[1].mHeight = (img->d_h + 1) >> img->y_chroma_shift; b.mPlanes[1].mWidth = (img->d_w + 1) >> img->x_chroma_shift; b.mPlanes[1].mOffset = b.mPlanes[1].mSkip = 0; b.mPlanes[2].mData = img->planes[2]; b.mPlanes[2].mStride = img->stride[2]; b.mPlanes[2].mHeight = (img->d_h + 1) >> img->y_chroma_shift; b.mPlanes[2].mWidth = (img->d_w + 1) >> img->x_chroma_shift; b.mPlanes[2].mOffset = b.mPlanes[2].mSkip = 0; IntRect picture = ToIntRect(mPicture); if (img->d_w != static_cast(mInitialFrame.width) || img->d_h != static_cast(mInitialFrame.height)) { // Frame size is different from what the container reports. This is legal // in WebM, and we will preserve the ratio of the crop rectangle as it // was reported relative to the picture size reported by the container. picture.x = (mPicture.x * img->d_w) / mInitialFrame.width; picture.y = (mPicture.y * img->d_h) / mInitialFrame.height; picture.width = (img->d_w * mPicture.width) / mInitialFrame.width; picture.height = (img->d_h * mPicture.height) / mInitialFrame.height; } VideoData *v = VideoData::Create(mInfo.mVideo, mDecoder->GetImageContainer(), holder->mOffset, tstamp_usecs, (next_tstamp / NS_PER_USEC) - tstamp_usecs, b, si.is_kf, -1, picture); if (!v) { return false; } parsed++; decoded++; NS_ASSERTION(decoded <= parsed, "Expect only 1 frame per chunk per packet in WebM..."); VideoQueue().Push(v); } } return true; } void WebMReader::PushVideoPacket(NesteggPacketHolder* aItem) { mVideoPackets.PushFront(aItem); } nsresult WebMReader::Seek(int64_t aTarget, int64_t aStartTime, int64_t aEndTime, int64_t aCurrentTime) { NS_ASSERTION(mDecoder->OnDecodeThread(), "Should be on decode thread."); LOG(PR_LOG_DEBUG, ("Reader [%p] for Decoder [%p]: About to seek to %fs", this, mDecoder, aTarget/1000000.0)); if (NS_FAILED(ResetDecode())) { return NS_ERROR_FAILURE; } uint32_t trackToSeek = mHasVideo ? mVideoTrack : mAudioTrack; uint64_t target = aTarget * NS_PER_USEC; if (mSeekPreroll) { target = std::max(static_cast(aStartTime * NS_PER_USEC), target - mSeekPreroll); } int r = nestegg_track_seek(mContext, trackToSeek, target); if (r != 0) { return NS_ERROR_FAILURE; } return DecodeToTarget(aTarget); } nsresult WebMReader::GetBuffered(dom::TimeRanges* aBuffered, int64_t aStartTime) { MediaResource* resource = mDecoder->GetResource(); uint64_t timecodeScale; if (!mContext || nestegg_tstamp_scale(mContext, &timecodeScale) == -1) { return NS_OK; } // Special case completely cached files. This also handles local files. bool isFullyCached = resource->IsDataCachedToEndOfResource(0); if (isFullyCached) { uint64_t duration = 0; if (nestegg_duration(mContext, &duration) == 0) { aBuffered->Add(0, duration / NS_PER_S); } } uint32_t bufferedLength = 0; aBuffered->GetLength(&bufferedLength); // Either we the file is not fully cached, or we couldn't find a duration in // the WebM bitstream. if (!isFullyCached || !bufferedLength) { MediaResource* resource = mDecoder->GetResource(); nsTArray ranges; nsresult res = resource->GetCachedRanges(ranges); NS_ENSURE_SUCCESS(res, res); for (uint32_t index = 0; index < ranges.Length(); index++) { uint64_t start, end; bool rv = mBufferedState->CalculateBufferedForRange(ranges[index].mStart, ranges[index].mEnd, &start, &end); if (rv) { double startTime = start * timecodeScale / NS_PER_S - aStartTime; double endTime = end * timecodeScale / NS_PER_S - aStartTime; // If this range extends to the end of the file, the true end time // is the file's duration. if (resource->IsDataCachedToEndOfResource(ranges[index].mStart)) { uint64_t duration = 0; if (nestegg_duration(mContext, &duration) == 0) { endTime = duration / NS_PER_S; } } aBuffered->Add(startTime, endTime); } } } return NS_OK; } void WebMReader::NotifyDataArrived(const char* aBuffer, uint32_t aLength, int64_t aOffset) { mBufferedState->NotifyDataArrived(aBuffer, aLength, aOffset); } } // namespace mozilla