/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ /* vim: set ts=8 sts=2 et sw=2 tw=80: */ /* This Source Code Form is subject to the terms of the Mozilla Public * License, v. 2.0. If a copy of the MPL was not distributed with this * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ #if !defined(MediaInfo_h) # define MediaInfo_h # include "mozilla/UniquePtr.h" # include "mozilla/RefPtr.h" # include "nsDataHashtable.h" # include "nsString.h" # include "nsTArray.h" # include "AudioConfig.h" # include "ImageTypes.h" # include "MediaData.h" # include "TimeUnits.h" # include "mozilla/gfx/Point.h" // for gfx::IntSize # include "mozilla/gfx/Rect.h" // for gfx::IntRect # include "mozilla/gfx/Types.h" // for gfx::ColorDepth namespace mozilla { class AudioInfo; class VideoInfo; class TextInfo; class MetadataTag { public: MetadataTag(const nsACString& aKey, const nsACString& aValue) : mKey(aKey), mValue(aValue) {} nsCString mKey; nsCString mValue; bool operator==(const MetadataTag& rhs) const { return mKey == rhs.mKey && mValue == rhs.mValue; } }; typedef nsDataHashtable MetadataTags; class TrackInfo { public: enum TrackType { kUndefinedTrack, kAudioTrack, kVideoTrack, kTextTrack }; TrackInfo(TrackType aType, const nsAString& aId, const nsAString& aKind, const nsAString& aLabel, const nsAString& aLanguage, bool aEnabled, uint32_t aTrackId) : mId(aId), mKind(aKind), mLabel(aLabel), mLanguage(aLanguage), mEnabled(aEnabled), mTrackId(aTrackId), mIsRenderedExternally(false), mType(aType) { MOZ_COUNT_CTOR(TrackInfo); } // Only used for backward compatibility. Do not use in new code. void Init(const nsAString& aId, const nsAString& aKind, const nsAString& aLabel, const nsAString& aLanguage, bool aEnabled) { mId = aId; mKind = aKind; mLabel = aLabel; mLanguage = aLanguage; mEnabled = aEnabled; } // Fields common with MediaTrack object. nsString mId; nsString mKind; nsString mLabel; nsString mLanguage; bool mEnabled; uint32_t mTrackId; nsCString mMimeType; media::TimeUnit mDuration; media::TimeUnit mMediaTime; CryptoTrack mCrypto; nsTArray mTags; // True if the track is gonna be (decrypted)/decoded and // rendered directly by non-gecko components. bool mIsRenderedExternally; virtual AudioInfo* GetAsAudioInfo() { return nullptr; } virtual VideoInfo* GetAsVideoInfo() { return nullptr; } virtual TextInfo* GetAsTextInfo() { return nullptr; } virtual const AudioInfo* GetAsAudioInfo() const { return nullptr; } virtual const VideoInfo* GetAsVideoInfo() const { return nullptr; } virtual const TextInfo* GetAsTextInfo() const { return nullptr; } bool IsAudio() const { return !!GetAsAudioInfo(); } bool IsVideo() const { return !!GetAsVideoInfo(); } bool IsText() const { return !!GetAsTextInfo(); } TrackType GetType() const { return mType; } bool virtual IsValid() const = 0; virtual UniquePtr Clone() const = 0; MOZ_COUNTED_DTOR_VIRTUAL(TrackInfo) protected: TrackInfo(const TrackInfo& aOther) { mId = aOther.mId; mKind = aOther.mKind; mLabel = aOther.mLabel; mLanguage = aOther.mLanguage; mEnabled = aOther.mEnabled; mTrackId = aOther.mTrackId; mMimeType = aOther.mMimeType; mDuration = aOther.mDuration; mMediaTime = aOther.mMediaTime; mCrypto = aOther.mCrypto; mIsRenderedExternally = aOther.mIsRenderedExternally; mType = aOther.mType; mTags = aOther.mTags; MOZ_COUNT_CTOR(TrackInfo); } bool IsEqualTo(const TrackInfo& rhs) const; private: TrackType mType; }; // String version of track type. const char* TrackTypeToStr(TrackInfo::TrackType aTrack); // Stores info relevant to presenting media frames. class VideoInfo : public TrackInfo { public: enum Rotation { kDegree_0 = 0, kDegree_90 = 90, kDegree_180 = 180, kDegree_270 = 270, }; VideoInfo() : VideoInfo(-1, -1) {} explicit VideoInfo(int32_t aWidth, int32_t aHeight) : VideoInfo(gfx::IntSize(aWidth, aHeight)) {} explicit VideoInfo(const gfx::IntSize& aSize) : TrackInfo(kVideoTrack, NS_LITERAL_STRING("2"), NS_LITERAL_STRING("main"), EmptyString(), EmptyString(), true, 2), mDisplay(aSize), mStereoMode(StereoMode::MONO), mImage(aSize), mCodecSpecificConfig(new MediaByteBuffer), mExtraData(new MediaByteBuffer), mRotation(kDegree_0), mImageRect(gfx::IntRect(gfx::IntPoint(), aSize)) {} VideoInfo(const VideoInfo& aOther) = default; bool operator==(const VideoInfo& rhs) const; bool IsValid() const override { return mDisplay.width > 0 && mDisplay.height > 0; } VideoInfo* GetAsVideoInfo() override { return this; } const VideoInfo* GetAsVideoInfo() const override { return this; } UniquePtr Clone() const override { return MakeUnique(*this); } void SetAlpha(bool aAlphaPresent) { mAlphaPresent = aAlphaPresent; } bool HasAlpha() const { return mAlphaPresent; } gfx::IntRect ImageRect() const { if (mImageRect.Width() < 0 || mImageRect.Height() < 0) { return gfx::IntRect(0, 0, mImage.width, mImage.height); } return mImageRect; } void SetImageRect(const gfx::IntRect& aRect) { mImageRect = aRect; } // Returned the crop rectangle scaled to aWidth/aHeight size relative to // mImage size. // If aWidth and aHeight are identical to the original // mImage.width/mImage.height then the scaling ratio will be 1. This is used // for when the frame size is different from what the container reports. This // is legal in WebM, and we will preserve the ratio of the crop rectangle as // it was reported relative to the picture size reported by the container. gfx::IntRect ScaledImageRect(int64_t aWidth, int64_t aHeight) const { if ((aWidth == mImage.width && aHeight == mImage.height) || !mImage.width || !mImage.height) { return ImageRect(); } gfx::IntRect imageRect = ImageRect(); int64_t w = (aWidth * imageRect.Width()) / mImage.width; int64_t h = (aHeight * imageRect.Height()) / mImage.height; if (!w || !h) { return imageRect; } imageRect.x = (imageRect.x * aWidth) / mImage.width; imageRect.y = (imageRect.y * aHeight) / mImage.height; imageRect.SetWidth(w); imageRect.SetHeight(h); return imageRect; } Rotation ToSupportedRotation(int32_t aDegree) const { switch (aDegree) { case 90: return kDegree_90; case 180: return kDegree_180; case 270: return kDegree_270; default: NS_WARNING_ASSERTION(aDegree == 0, "Invalid rotation degree, ignored"); return kDegree_0; } } // Size in pixels at which the video is rendered. This is after it has // been scaled by its aspect ratio. gfx::IntSize mDisplay; // Indicates the frame layout for single track stereo videos. StereoMode mStereoMode; // Size of the decoded video's image. gfx::IntSize mImage; RefPtr mCodecSpecificConfig; RefPtr mExtraData; // Describing how many degrees video frames should be rotated in clock-wise to // get correct view. Rotation mRotation; // Should be 8, 10 or 12. Default value is 8. gfx::ColorDepth mColorDepth = gfx::ColorDepth::COLOR_8; gfx::YUVColorSpace mColorSpace = gfx::YUVColorSpace::UNKNOWN; // True indicates no restriction on Y, U, V values (otherwise 16-235 for 8 // bits etc) gfx::ColorRange mColorRange = gfx::ColorRange::LIMITED; Maybe GetFrameRate() const { return mFrameRate; } void SetFrameRate(int32_t aRate) { mFrameRate = Some(aRate); } private: // mImage may be cropped; currently only used with the WebM container. // A negative width or height indicate that no cropping is to occur. gfx::IntRect mImageRect; // Indicates whether or not frames may contain alpha information. bool mAlphaPresent = false; Maybe mFrameRate; }; class AudioInfo : public TrackInfo { public: AudioInfo() : TrackInfo(kAudioTrack, NS_LITERAL_STRING("1"), NS_LITERAL_STRING("main"), EmptyString(), EmptyString(), true, 1), mRate(0), mChannels(0), mChannelMap(AudioConfig::ChannelLayout::UNKNOWN_MAP), mBitDepth(0), mProfile(0), mExtendedProfile(0), mCodecSpecificConfig(new MediaByteBuffer), mExtraData(new MediaByteBuffer) {} AudioInfo(const AudioInfo& aOther) = default; bool operator==(const AudioInfo& rhs) const; static const uint32_t MAX_RATE = 640000; bool IsValid() const override { return mChannels > 0 && mRate > 0 && mRate <= MAX_RATE; } AudioInfo* GetAsAudioInfo() override { return this; } const AudioInfo* GetAsAudioInfo() const override { return this; } UniquePtr Clone() const override { return MakeUnique(*this); } // Sample rate. uint32_t mRate; // Number of audio channels. uint32_t mChannels; // The AudioConfig::ChannelLayout map. Channels are ordered as per SMPTE // definition. A value of UNKNOWN_MAP indicates unknown layout. // ChannelMap is an unsigned bitmap compatible with Windows' WAVE and FFmpeg // channel map. AudioConfig::ChannelLayout::ChannelMap mChannelMap; // Bits per sample. uint32_t mBitDepth; // Codec profile. int8_t mProfile; // Extended codec profile. int8_t mExtendedProfile; RefPtr mCodecSpecificConfig; RefPtr mExtraData; }; class EncryptionInfo { public: EncryptionInfo() : mEncrypted(false) {} struct InitData { template InitData(const nsAString& aType, AInitDatas&& aInitData) : mType(aType), mInitData(std::forward(aInitData)) {} // Encryption type to be passed to JS. Usually `cenc'. nsString mType; // Encryption data. nsTArray mInitData; }; typedef nsTArray InitDatas; // True if the stream has encryption metadata bool IsEncrypted() const { return mEncrypted; } void Reset() { mEncrypted = false; mInitDatas.Clear(); } template void AddInitData(const nsAString& aType, AInitDatas&& aInitData) { mInitDatas.AppendElement( InitData(aType, std::forward(aInitData))); mEncrypted = true; } void AddInitData(const EncryptionInfo& aInfo) { mInitDatas.AppendElements(aInfo.mInitDatas); mEncrypted = !!mInitDatas.Length(); } // One 'InitData' per encrypted buffer. InitDatas mInitDatas; private: bool mEncrypted; }; class MediaInfo { public: bool HasVideo() const { return mVideo.IsValid(); } void EnableVideo() { if (HasVideo()) { return; } // Set dummy values so that HasVideo() will return true; // See VideoInfo::IsValid() mVideo.mDisplay = gfx::IntSize(1, 1); } bool HasAudio() const { return mAudio.IsValid(); } void EnableAudio() { if (HasAudio()) { return; } // Set dummy values so that HasAudio() will return true; // See AudioInfo::IsValid() mAudio.mChannels = 2; mAudio.mRate = 44100; } bool IsEncrypted() const { return (HasAudio() && mAudio.mCrypto.IsEncrypted()) || (HasVideo() && mVideo.mCrypto.IsEncrypted()); } bool HasValidMedia() const { return HasVideo() || HasAudio(); } // TODO: Store VideoInfo and AudioIndo in arrays to support multi-tracks. VideoInfo mVideo; AudioInfo mAudio; // If the metadata includes a duration, we store it here. media::NullableTimeUnit mMetadataDuration; // The Ogg reader tries to kinda-sorta compute the duration by seeking to the // end and determining the timestamp of the last frame. This isn't useful as // a duration until we know the start time, so we need to track it separately. media::NullableTimeUnit mUnadjustedMetadataEndTime; // True if the media is seekable (i.e. supports random access). bool mMediaSeekable = true; // True if the media is only seekable within its buffered ranges. bool mMediaSeekableOnlyInBufferedRanges = false; EncryptionInfo mCrypto; // The minimum of start times of audio and video tracks. // Use to map the zero time on the media timeline to the first frame. media::TimeUnit mStartTime; }; class TrackInfoSharedPtr { NS_INLINE_DECL_THREADSAFE_REFCOUNTING(TrackInfoSharedPtr) public: TrackInfoSharedPtr(const TrackInfo& aOriginal, uint32_t aStreamID) : mInfo(aOriginal.Clone()), mStreamSourceID(aStreamID), mMimeType(mInfo->mMimeType) {} uint32_t GetID() const { return mStreamSourceID; } operator const TrackInfo*() const { return mInfo.get(); } const TrackInfo* operator*() const { return mInfo.get(); } const TrackInfo* operator->() const { MOZ_ASSERT(mInfo.get(), "dereferencing a UniquePtr containing nullptr"); return mInfo.get(); } const AudioInfo* GetAsAudioInfo() const { return mInfo ? mInfo->GetAsAudioInfo() : nullptr; } const VideoInfo* GetAsVideoInfo() const { return mInfo ? mInfo->GetAsVideoInfo() : nullptr; } const TextInfo* GetAsTextInfo() const { return mInfo ? mInfo->GetAsTextInfo() : nullptr; } private: ~TrackInfoSharedPtr() = default; UniquePtr mInfo; // A unique ID, guaranteed to change when changing streams. uint32_t mStreamSourceID; public: const nsCString& mMimeType; }; } // namespace mozilla #endif // MediaInfo_h