/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ /* vim:set ts=2 sw=2 sts=2 et cindent: */ /* This Source Code Form is subject to the terms of the Mozilla Public * License, v. 2.0. If a copy of the MPL was not distributed with this * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ #if !defined(nsOggReader_h_) #define nsOggReader_h_ #include #include #ifdef MOZ_TREMOR #include #else #include #endif #include "nsBuiltinDecoderReader.h" #include "nsOggCodecState.h" #include "VideoUtils.h" using namespace mozilla; class nsMediaDecoder; class nsTimeRanges; class nsOggReader : public nsBuiltinDecoderReader { public: nsOggReader(nsBuiltinDecoder* aDecoder); ~nsOggReader(); virtual nsresult Init(nsBuiltinDecoderReader* aCloneDonor); virtual nsresult ResetDecode(); virtual bool DecodeAudioData(); // If the Theora granulepos has not been captured, it may read several packets // until one with a granulepos has been captured, to ensure that all packets // read have valid time info. virtual bool DecodeVideoFrame(bool &aKeyframeSkip, PRInt64 aTimeThreshold); virtual bool HasAudio() { return (mVorbisState != 0 && mVorbisState->mActive) || (mOpusState != 0 && mOpusState->mActive); } virtual bool HasVideo() { return mTheoraState != 0 && mTheoraState->mActive; } virtual nsresult ReadMetadata(nsVideoInfo* aInfo); virtual nsresult Seek(PRInt64 aTime, PRInt64 aStartTime, PRInt64 aEndTime, PRInt64 aCurrentTime); virtual nsresult GetBuffered(nsTimeRanges* aBuffered, PRInt64 aStartTime); // We use bisection to seek in buffered range. virtual bool IsSeekableInBufferedRanges() { return true; } private: bool HasSkeleton() { return mSkeletonState != 0 && mSkeletonState->mActive; } // Seeks to the keyframe preceeding the target time using available // keyframe indexes. enum IndexedSeekResult { SEEK_OK, // Success. SEEK_INDEX_FAIL, // Failure due to no index, or invalid index. SEEK_FATAL_ERROR // Error returned by a stream operation. }; IndexedSeekResult SeekToKeyframeUsingIndex(PRInt64 aTarget); // Rolls back a seek-using-index attempt, returning a failure error code. IndexedSeekResult RollbackIndexedSeek(PRInt64 aOffset); // Represents a section of contiguous media, with a start and end offset, // and the timestamps of the start and end of that range, that is cached. // Used to denote the extremities of a range in which we can seek quickly // (because it's cached). class SeekRange { public: SeekRange() : mOffsetStart(0), mOffsetEnd(0), mTimeStart(0), mTimeEnd(0) {} SeekRange(PRInt64 aOffsetStart, PRInt64 aOffsetEnd, PRInt64 aTimeStart, PRInt64 aTimeEnd) : mOffsetStart(aOffsetStart), mOffsetEnd(aOffsetEnd), mTimeStart(aTimeStart), mTimeEnd(aTimeEnd) {} bool IsNull() const { return mOffsetStart == 0 && mOffsetEnd == 0 && mTimeStart == 0 && mTimeEnd == 0; } PRInt64 mOffsetStart, mOffsetEnd; // in bytes. PRInt64 mTimeStart, mTimeEnd; // in usecs. }; // Seeks to aTarget usecs in the buffered range aRange using bisection search, // or to the keyframe prior to aTarget if we have video. aStartTime must be // the presentation time at the start of media, and aEndTime the time at // end of media. aRanges must be the time/byte ranges buffered in the media // cache as per GetSeekRanges(). nsresult SeekInBufferedRange(PRInt64 aTarget, PRInt64 aStartTime, PRInt64 aEndTime, const nsTArray& aRanges, const SeekRange& aRange); // Seeks to before aTarget usecs in media using bisection search. If the media // has video, this will seek to before the keyframe required to render the // media at aTarget. Will use aRanges in order to narrow the bisection // search space. aStartTime must be the presentation time at the start of // media, and aEndTime the time at end of media. aRanges must be the time/byte // ranges buffered in the media cache as per GetSeekRanges(). nsresult SeekInUnbuffered(PRInt64 aTarget, PRInt64 aStartTime, PRInt64 aEndTime, const nsTArray& aRanges); // Get the end time of aEndOffset. This is the playback position we'd reach // after playback finished at aEndOffset. PRInt64 RangeEndTime(PRInt64 aEndOffset); // Get the end time of aEndOffset, without reading before aStartOffset. // This is the playback position we'd reach after playback finished at // aEndOffset. If bool aCachedDataOnly is true, then we'll only read // from data which is cached in the media cached, otherwise we'll do // regular blocking reads from the media stream. If bool aCachedDataOnly // is true, this can safely be called on the main thread, otherwise it // must be called on the state machine thread. PRInt64 RangeEndTime(PRInt64 aStartOffset, PRInt64 aEndOffset, bool aCachedDataOnly); // Get the start time of the range beginning at aOffset. This is the start // time of the first frame and or audio sample we'd be able to play if we // started playback at aOffset. PRInt64 RangeStartTime(PRInt64 aOffset); // Performs a seek bisection to move the media stream's read cursor to the // last ogg page boundary which has end time before aTarget usecs on both the // Theora and Vorbis bitstreams. Limits its search to data inside aRange; // i.e. it will only read inside of the aRange's start and end offsets. // aFuzz is the number of usecs of leniency we'll allow; we'll terminate the // seek when we land in the range (aTime - aFuzz, aTime) usecs. nsresult SeekBisection(PRInt64 aTarget, const SeekRange& aRange, PRUint32 aFuzz); // Returns true if the serial number is for a stream we encountered // while reading metadata. Call on the main thread only. bool IsKnownStream(PRUint32 aSerial); // Fills aRanges with SeekRanges denoting the sections of the media which // have been downloaded and are stored in the media cache. The reader // monitor must must be held with exactly one lock count. The MediaResource // must be pinned while calling this. nsresult GetSeekRanges(nsTArray& aRanges); // Returns the range in which you should perform a seek bisection if // you wish to seek to aTarget usecs, given the known (buffered) byte ranges // in aRanges. If aExact is true, we only return an exact copy of a // range in which aTarget lies, or a null range if aTarget isn't contained // in any of the (buffered) ranges. Otherwise, when aExact is false, // we'll construct the smallest possible range we can, based on the times // and byte offsets known in aRanges. We can then use this to minimize our // bisection's search space when the target isn't in a known buffered range. SeekRange SelectSeekRange(const nsTArray& aRanges, PRInt64 aTarget, PRInt64 aStartTime, PRInt64 aEndTime, bool aExact); private: // Decodes a packet of Vorbis data, and inserts its samples into the // audio queue. nsresult DecodeVorbis(ogg_packet* aPacket); // Decodes a packet of Opus data, and inserts its samples into the // audio queue. nsresult DecodeOpus(ogg_packet* aPacket); // Decodes a packet of Theora data, and inserts its frame into the // video queue. May return NS_ERROR_OUT_OF_MEMORY. Caller must have obtained // the reader's monitor. aTimeThreshold is the current playback position // in media time in microseconds. Frames with an end time before this will // not be enqueued. nsresult DecodeTheora(ogg_packet* aPacket, PRInt64 aTimeThreshold); // Read a page of data from the Ogg file. Returns the offset of the start // of the page, or -1 if the page read failed. PRInt64 ReadOggPage(ogg_page* aPage); // Reads and decodes header packets for aState, until either header decode // fails, or is complete. Initializes the codec state before returning. // Returns true if reading headers and initializtion of the stream // succeeds. bool ReadHeaders(nsOggCodecState* aState); // Returns the next Ogg packet for an bitstream/codec state. Returns a // pointer to an ogg_packet on success, or nsnull if the read failed. // The caller is responsible for deleting the packet and its |packet| field. ogg_packet* NextOggPacket(nsOggCodecState* aCodecState); // Maps Ogg serialnos to nsOggStreams. nsClassHashtable mCodecStates; // Array of serial numbers of streams that were encountered during // initial metadata load. Written on state machine thread during // metadata loading and read on the main thread only after metadata // is loaded. nsAutoTArray mKnownStreams; // Decode state of the Theora bitstream we're decoding, if we have video. nsTheoraState* mTheoraState; // Decode state of the Vorbis bitstream we're decoding, if we have audio. nsVorbisState* mVorbisState; // Decode state of the Opus bitstream we're decoding, if we have one. nsOpusState *mOpusState; // Represents the user pref media.opus.enabled at the time our // contructor was called. We can't check it dynamically because // we're not on the main thread; bool mOpusEnabled; // Decode state of the Skeleton bitstream. nsSkeletonState* mSkeletonState; // Ogg decoding state. ogg_sync_state mOggState; // Vorbis/Theora data used to compute timestamps. This is written on the // decoder thread and read on the main thread. All reading on the main // thread must be done after metadataloaded. We can't use the existing // data in the codec states due to threading issues. You must check the // associated mTheoraState or mVorbisState pointer is non-null before // using this codec data. PRUint32 mVorbisSerial; PRUint32 mTheoraSerial; vorbis_info mVorbisInfo; th_info mTheoraInfo; // The offset of the end of the last page we've read, or the start of // the page we're about to read. PRInt64 mPageOffset; // The picture region inside Theora frame to be displayed, if we have // a Theora video track. nsIntRect mPicture; }; #endif