/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ /* vim:set ts=2 sw=2 sts=2 et cindent: */ /* ***** BEGIN LICENSE BLOCK ***** * Version: MPL 1.1/GPL 2.0/LGPL 2.1 * * The contents of this file are subject to the Mozilla Public License Version * 1.1 (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * http://www.mozilla.org/MPL/ * * Software distributed under the License is distributed on an "AS IS" basis, * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License * for the specific language governing rights and limitations under the * License. * * The Original Code is Mozilla code. * * The Initial Developer of the Original Code is the Mozilla Corporation. * Portions created by the Initial Developer are Copyright (C) 2007 * the Initial Developer. All Rights Reserved. * * Contributor(s): * Chris Double * Chris Pearce * * Alternatively, the contents of this file may be used under the terms of * either the GNU General Public License Version 2 or later (the "GPL"), or * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"), * in which case the provisions of the GPL or the LGPL are applicable instead * of those above. If you wish to allow use of your version of this file only * under the terms of either the GPL or the LGPL, and not to allow others to * use your version of this file under the terms of the MPL, indicate your * decision by deleting the provisions above and replace them with the notice * and other provisions required by the GPL or the LGPL. If you do not delete * the provisions above, a recipient may use your version of this file under * the terms of any one of the MPL, the GPL or the LGPL. * * ***** END LICENSE BLOCK ***** */ #if !defined(nsOggReader_h_) #define nsOggReader_h_ #include #include #ifdef MOZ_TREMOR #include #else #include #endif #include "nsBuiltinDecoderReader.h" #include "nsOggCodecState.h" #include "VideoUtils.h" using namespace mozilla; class nsMediaDecoder; class nsTimeRanges; class nsOggReader : public nsBuiltinDecoderReader { public: nsOggReader(nsBuiltinDecoder* aDecoder); ~nsOggReader(); virtual nsresult Init(nsBuiltinDecoderReader* aCloneDonor); virtual nsresult ResetDecode(); virtual PRBool DecodeAudioData(); // If the Theora granulepos has not been captured, it may read several packets // until one with a granulepos has been captured, to ensure that all packets // read have valid time info. virtual PRBool DecodeVideoFrame(PRBool &aKeyframeSkip, PRInt64 aTimeThreshold); virtual PRBool HasAudio() { mozilla::ReentrantMonitorAutoEnter mon(mReentrantMonitor); return mVorbisState != 0 && mVorbisState->mActive; } virtual PRBool HasVideo() { mozilla::ReentrantMonitorAutoEnter mon(mReentrantMonitor); return mTheoraState != 0 && mTheoraState->mActive; } virtual nsresult ReadMetadata(nsVideoInfo* aInfo); virtual nsresult Seek(PRInt64 aTime, PRInt64 aStartTime, PRInt64 aEndTime, PRInt64 aCurrentTime); virtual nsresult GetBuffered(nsTimeRanges* aBuffered, PRInt64 aStartTime); private: PRBool HasSkeleton() { ReentrantMonitorAutoEnter mon(mReentrantMonitor); return mSkeletonState != 0 && mSkeletonState->mActive; } // Returns PR_TRUE if we should decode up to the seek target rather than // seeking to the target using a bisection search or index-assisted seek. // We should do this if the seek target (aTarget, in usecs), lies not too far // ahead of the current playback position (aCurrentTime, in usecs). PRBool CanDecodeToTarget(PRInt64 aTarget, PRInt64 aCurrentTime); // Seeks to the keyframe preceeding the target time using available // keyframe indexes. enum IndexedSeekResult { SEEK_OK, // Success. SEEK_INDEX_FAIL, // Failure due to no index, or invalid index. SEEK_FATAL_ERROR // Error returned by a stream operation. }; IndexedSeekResult SeekToKeyframeUsingIndex(PRInt64 aTarget); // Rolls back a seek-using-index attempt, returning a failure error code. IndexedSeekResult RollbackIndexedSeek(PRInt64 aOffset); // Represents a section of contiguous media, with a start and end offset, // and the timestamps of the start and end of that range, that is cached. // Used to denote the extremities of a range in which we can seek quickly // (because it's cached). class SeekRange { public: SeekRange() : mOffsetStart(0), mOffsetEnd(0), mTimeStart(0), mTimeEnd(0) {} SeekRange(PRInt64 aOffsetStart, PRInt64 aOffsetEnd, PRInt64 aTimeStart, PRInt64 aTimeEnd) : mOffsetStart(aOffsetStart), mOffsetEnd(aOffsetEnd), mTimeStart(aTimeStart), mTimeEnd(aTimeEnd) {} PRBool IsNull() const { return mOffsetStart == 0 && mOffsetEnd == 0 && mTimeStart == 0 && mTimeEnd == 0; } PRInt64 mOffsetStart, mOffsetEnd; // in bytes. PRInt64 mTimeStart, mTimeEnd; // in usecs. }; // Seeks to aTarget usecs in the buffered range aRange using bisection search, // or to the keyframe prior to aTarget if we have video. aStartTime must be // the presentation time at the start of media, and aEndTime the time at // end of media. aRanges must be the time/byte ranges buffered in the media // cache as per GetSeekRanges(). nsresult SeekInBufferedRange(PRInt64 aTarget, PRInt64 aStartTime, PRInt64 aEndTime, const nsTArray& aRanges, const SeekRange& aRange); // Seeks to before aTarget usecs in media using bisection search. If the media // has video, this will seek to before the keyframe required to render the // media at aTarget. Will use aRanges in order to narrow the bisection // search space. aStartTime must be the presentation time at the start of // media, and aEndTime the time at end of media. aRanges must be the time/byte // ranges buffered in the media cache as per GetSeekRanges(). nsresult SeekInUnbuffered(PRInt64 aTarget, PRInt64 aStartTime, PRInt64 aEndTime, const nsTArray& aRanges); // Get the end time of aEndOffset. This is the playback position we'd reach // after playback finished at aEndOffset. PRInt64 RangeEndTime(PRInt64 aEndOffset); // Get the end time of aEndOffset, without reading before aStartOffset. // This is the playback position we'd reach after playback finished at // aEndOffset. If PRBool aCachedDataOnly is PR_TRUE, then we'll only read // from data which is cached in the media cached, otherwise we'll do // regular blocking reads from the media stream. If PRBool aCachedDataOnly // is PR_TRUE, this can safely be called on the main thread, otherwise it // must be called on the state machine thread. PRInt64 RangeEndTime(PRInt64 aStartOffset, PRInt64 aEndOffset, PRBool aCachedDataOnly); // Get the start time of the range beginning at aOffset. This is the start // time of the first frame and or audio sample we'd be able to play if we // started playback at aOffset. PRInt64 RangeStartTime(PRInt64 aOffset); // Performs a seek bisection to move the media stream's read cursor to the // last ogg page boundary which has end time before aTarget usecs on both the // Theora and Vorbis bitstreams. Limits its search to data inside aRange; // i.e. it will only read inside of the aRange's start and end offsets. // aFuzz is the number of usecs of leniency we'll allow; we'll terminate the // seek when we land in the range (aTime - aFuzz, aTime) usecs. nsresult SeekBisection(PRInt64 aTarget, const SeekRange& aRange, PRUint32 aFuzz); // Returns true if the serial number is for a stream we encountered // while reading metadata. Call on the main thread only. PRBool IsKnownStream(PRUint32 aSerial); // Fills aRanges with SeekRanges denoting the sections of the media which // have been downloaded and are stored in the media cache. The reader // monitor must must be held with exactly one lock count. The nsMediaStream // must be pinned while calling this. nsresult GetSeekRanges(nsTArray& aRanges); // Returns the range in which you should perform a seek bisection if // you wish to seek to aTarget usecs, given the known (buffered) byte ranges // in aRanges. If aExact is PR_TRUE, we only return an exact copy of a // range in which aTarget lies, or a null range if aTarget isn't contained // in any of the (buffered) ranges. Otherwise, when aExact is PR_FALSE, // we'll construct the smallest possible range we can, based on the times // and byte offsets known in aRanges. We can then use this to minimize our // bisection's search space when the target isn't in a known buffered range. SeekRange SelectSeekRange(const nsTArray& aRanges, PRInt64 aTarget, PRInt64 aStartTime, PRInt64 aEndTime, PRBool aExact); private: // Decodes a packet of Vorbis data, and inserts its samples into the // audio queue. nsresult DecodeVorbis(ogg_packet* aPacket); // Decodes a packet of Theora data, and inserts its frame into the // video queue. May return NS_ERROR_OUT_OF_MEMORY. Caller must have obtained // the reader's monitor. aTimeThreshold is the current playback position // in media time in microseconds. Frames with an end time before this will // not be enqueued. nsresult DecodeTheora(ogg_packet* aPacket, PRInt64 aTimeThreshold); // Read a page of data from the Ogg file. Returns the offset of the start // of the page, or -1 if the page read failed. PRInt64 ReadOggPage(ogg_page* aPage); // Reads and decodes header packets for aState, until either header decode // fails, or is complete. Initializes the codec state before returning. // Returns PR_TRUE if reading headers and initializtion of the stream // succeeds. PRBool ReadHeaders(nsOggCodecState* aState); // Returns the next Ogg packet for an bitstream/codec state. Returns a // pointer to an ogg_packet on success, or nsnull if the read failed. // The caller is responsible for deleting the packet and its |packet| field. ogg_packet* NextOggPacket(nsOggCodecState* aCodecState); // Maps Ogg serialnos to nsOggStreams. nsClassHashtable mCodecStates; // Array of serial numbers of streams that were encountered during // initial metadata load. Written on state machine thread during // metadata loading and read on the main thread only after metadata // is loaded. nsAutoTArray mKnownStreams; // Decode state of the Theora bitstream we're decoding, if we have video. nsTheoraState* mTheoraState; // Decode state of the Vorbis bitstream we're decoding, if we have audio. nsVorbisState* mVorbisState; // Decode state of the Skeleton bitstream. nsSkeletonState* mSkeletonState; // Ogg decoding state. ogg_sync_state mOggState; // Vorbis/Theora data used to compute timestamps. This is written on the // decoder thread and read on the main thread. All reading on the main // thread must be done after metadataloaded. We can't use the existing // data in the codec states due to threading issues. You must check the // associated mTheoraState or mVorbisState pointer is non-null before // using this codec data. PRUint32 mVorbisSerial; PRUint32 mTheoraSerial; vorbis_info mVorbisInfo; th_info mTheoraInfo; // The offset of the end of the last page we've read, or the start of // the page we're about to read. PRInt64 mPageOffset; }; #endif