/* * Copyright (c) 2015 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. * */ #import "RTCVideoDecoderH264.h" #import #import "base/RTCVideoFrame.h" #import "base/RTCVideoFrameBuffer.h" #import "components/video_frame_buffer/RTCCVPixelBuffer.h" #import "helpers.h" #import "helpers/scoped_cftyperef.h" #if defined(WEBRTC_IOS) #import "helpers/UIDevice+RTCDevice.h" #endif #include "modules/video_coding/include/video_error_codes.h" #include "rtc_base/checks.h" #include "rtc_base/logging.h" #include "rtc_base/time_utils.h" #include "sdk/objc/components/video_codec/nalu_rewriter.h" // Struct that we pass to the decoder per frame to decode. We receive it again // in the decoder callback. struct RTCFrameDecodeParams { RTCFrameDecodeParams(RTCVideoDecoderCallback cb, int64_t ts) : callback(cb), timestamp(ts) {} RTCVideoDecoderCallback callback; int64_t timestamp; }; @interface RTC_OBJC_TYPE (RTCVideoDecoderH264) () - (void)setError : (OSStatus)error; @end // This is the callback function that VideoToolbox calls when decode is // complete. void decompressionOutputCallback(void *decoderRef, void *params, OSStatus status, VTDecodeInfoFlags infoFlags, CVImageBufferRef imageBuffer, CMTime timestamp, CMTime duration) { std::unique_ptr decodeParams( reinterpret_cast(params)); if (status != noErr) { RTC_OBJC_TYPE(RTCVideoDecoderH264) *decoder = (__bridge RTC_OBJC_TYPE(RTCVideoDecoderH264) *)decoderRef; [decoder setError:status]; RTC_LOG(LS_ERROR) << "Failed to decode frame. Status: " << status; return; } // TODO(tkchin): Handle CVO properly. RTC_OBJC_TYPE(RTCCVPixelBuffer) *frameBuffer = [[RTC_OBJC_TYPE(RTCCVPixelBuffer) alloc] initWithPixelBuffer:imageBuffer]; RTC_OBJC_TYPE(RTCVideoFrame) *decodedFrame = [[RTC_OBJC_TYPE(RTCVideoFrame) alloc] initWithBuffer:frameBuffer rotation:RTCVideoRotation_0 timeStampNs:CMTimeGetSeconds(timestamp) * rtc::kNumNanosecsPerSec]; decodedFrame.timeStamp = decodeParams->timestamp; decodeParams->callback(decodedFrame); } // Decoder. @implementation RTC_OBJC_TYPE (RTCVideoDecoderH264) { CMVideoFormatDescriptionRef _videoFormat; CMMemoryPoolRef _memoryPool; VTDecompressionSessionRef _decompressionSession; RTCVideoDecoderCallback _callback; OSStatus _error; } - (instancetype)init { self = [super init]; if (self) { _memoryPool = CMMemoryPoolCreate(nil); } return self; } - (void)dealloc { CMMemoryPoolInvalidate(_memoryPool); CFRelease(_memoryPool); [self destroyDecompressionSession]; [self setVideoFormat:nullptr]; } - (NSInteger)startDecodeWithNumberOfCores:(int)numberOfCores { return WEBRTC_VIDEO_CODEC_OK; } // TODO(bugs.webrtc.org/15444): Remove obsolete missingFrames param. - (NSInteger)decode:(RTC_OBJC_TYPE(RTCEncodedImage) *)inputImage missingFrames:(BOOL)missingFrames codecSpecificInfo:(nullable id)info renderTimeMs:(int64_t)renderTimeMs { RTC_DCHECK(inputImage.buffer); if (_error != noErr) { RTC_LOG(LS_WARNING) << "Last frame decode failed."; _error = noErr; return WEBRTC_VIDEO_CODEC_ERROR; } rtc::ScopedCFTypeRef inputFormat = rtc::ScopedCF(webrtc::CreateVideoFormatDescription((uint8_t *)inputImage.buffer.bytes, inputImage.buffer.length)); if (inputFormat) { // Check if the video format has changed, and reinitialize decoder if // needed. if (!CMFormatDescriptionEqual(inputFormat.get(), _videoFormat)) { [self setVideoFormat:inputFormat.get()]; int resetDecompressionSessionError = [self resetDecompressionSession]; if (resetDecompressionSessionError != WEBRTC_VIDEO_CODEC_OK) { return resetDecompressionSessionError; } } } if (!_videoFormat) { // We received a frame but we don't have format information so we can't // decode it. // This can happen after backgrounding. We need to wait for the next // sps/pps before we can resume so we request a keyframe by returning an // error. RTC_LOG(LS_WARNING) << "Missing video format. Frame with sps/pps required."; return WEBRTC_VIDEO_CODEC_ERROR; } CMSampleBufferRef sampleBuffer = nullptr; if (!webrtc::H264AnnexBBufferToCMSampleBuffer((uint8_t *)inputImage.buffer.bytes, inputImage.buffer.length, _videoFormat, &sampleBuffer, _memoryPool)) { return WEBRTC_VIDEO_CODEC_ERROR; } RTC_DCHECK(sampleBuffer); VTDecodeFrameFlags decodeFlags = kVTDecodeFrame_EnableAsynchronousDecompression; std::unique_ptr frameDecodeParams; frameDecodeParams.reset(new RTCFrameDecodeParams(_callback, inputImage.timeStamp)); OSStatus status = VTDecompressionSessionDecodeFrame( _decompressionSession, sampleBuffer, decodeFlags, frameDecodeParams.release(), nullptr); #if defined(WEBRTC_IOS) // Re-initialize the decoder if we have an invalid session while the app is // active or decoder malfunctions and retry the decode request. if ((status == kVTInvalidSessionErr || status == kVTVideoDecoderMalfunctionErr) && [self resetDecompressionSession] == WEBRTC_VIDEO_CODEC_OK) { RTC_LOG(LS_INFO) << "Failed to decode frame with code: " << status << " retrying decode after decompression session reset"; frameDecodeParams.reset(new RTCFrameDecodeParams(_callback, inputImage.timeStamp)); status = VTDecompressionSessionDecodeFrame( _decompressionSession, sampleBuffer, decodeFlags, frameDecodeParams.release(), nullptr); } #endif CFRelease(sampleBuffer); if (status != noErr) { RTC_LOG(LS_ERROR) << "Failed to decode frame with code: " << status; return WEBRTC_VIDEO_CODEC_ERROR; } return WEBRTC_VIDEO_CODEC_OK; } - (void)setCallback:(RTCVideoDecoderCallback)callback { _callback = callback; } - (void)setError:(OSStatus)error { _error = error; } - (NSInteger)releaseDecoder { // Need to invalidate the session so that callbacks no longer occur and it // is safe to null out the callback. [self destroyDecompressionSession]; [self setVideoFormat:nullptr]; _callback = nullptr; return WEBRTC_VIDEO_CODEC_OK; } #pragma mark - Private - (int)resetDecompressionSession { [self destroyDecompressionSession]; // Need to wait for the first SPS to initialize decoder. if (!_videoFormat) { return WEBRTC_VIDEO_CODEC_OK; } // Set keys for OpenGL and IOSurface compatibilty, which makes the encoder // create pixel buffers with GPU backed memory. The intent here is to pass // the pixel buffers directly so we avoid a texture upload later during // rendering. This currently is moot because we are converting back to an // I420 frame after decode, but eventually we will be able to plumb // CVPixelBuffers directly to the renderer. // TODO(tkchin): Maybe only set OpenGL/IOSurface keys if we know that that // we can pass CVPixelBuffers as native handles in decoder output. NSDictionary *attributes = @{ #if defined(WEBRTC_IOS) && (TARGET_OS_MACCATALYST || TARGET_OS_SIMULATOR) (NSString *)kCVPixelBufferMetalCompatibilityKey : @(YES), #elif defined(WEBRTC_IOS) (NSString *)kCVPixelBufferOpenGLESCompatibilityKey : @(YES), #elif defined(WEBRTC_MAC) && !defined(WEBRTC_ARCH_ARM64) (NSString *)kCVPixelBufferOpenGLCompatibilityKey : @(YES), #endif #if !(TARGET_OS_SIMULATOR) (NSString *)kCVPixelBufferIOSurfacePropertiesKey : @{}, #endif (NSString *) kCVPixelBufferPixelFormatTypeKey : @(kCVPixelFormatType_420YpCbCr8BiPlanarFullRange), }; VTDecompressionOutputCallbackRecord record = { decompressionOutputCallback, (__bridge void *)self, }; OSStatus status = VTDecompressionSessionCreate(nullptr, _videoFormat, nullptr, (__bridge CFDictionaryRef)attributes, &record, &_decompressionSession); if (status != noErr) { RTC_LOG(LS_ERROR) << "Failed to create decompression session: " << status; [self destroyDecompressionSession]; return WEBRTC_VIDEO_CODEC_ERROR; } [self configureDecompressionSession]; return WEBRTC_VIDEO_CODEC_OK; } - (void)configureDecompressionSession { RTC_DCHECK(_decompressionSession); #if defined(WEBRTC_IOS) VTSessionSetProperty(_decompressionSession, kVTDecompressionPropertyKey_RealTime, kCFBooleanTrue); #endif } - (void)destroyDecompressionSession { if (_decompressionSession) { #if defined(WEBRTC_IOS) VTDecompressionSessionWaitForAsynchronousFrames(_decompressionSession); #endif VTDecompressionSessionInvalidate(_decompressionSession); CFRelease(_decompressionSession); _decompressionSession = nullptr; } } - (void)setVideoFormat:(CMVideoFormatDescriptionRef)videoFormat { if (_videoFormat == videoFormat) { return; } if (_videoFormat) { CFRelease(_videoFormat); } _videoFormat = videoFormat; if (_videoFormat) { CFRetain(_videoFormat); } } - (NSString *)implementationName { return @"VideoToolbox"; } @end