Nagram/TMessagesProj/jni/tgcalls/platform/darwin/TGRTCVideoDecoderH264.mm

/*
 *  Copyright (c) 2015 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 *
 */

#import "TGRTCVideoDecoderH264.h"

#import <VideoToolbox/VideoToolbox.h>

#import "base/RTCVideoFrame.h"
#import "base/RTCVideoFrameBuffer.h"
#import "components/video_frame_buffer/RTCCVPixelBuffer.h"
#import "helpers.h"
#import "helpers/scoped_cftyperef.h"

#if defined(WEBRTC_IOS)
#import "helpers/UIDevice+RTCDevice.h"
#endif

#include "modules/video_coding/include/video_error_codes.h"
#include "rtc_base/checks.h"
#include "rtc_base/logging.h"
#include "rtc_base/time_utils.h"
#include "sdk/objc/components/video_codec/nalu_rewriter.h"

// Struct that we pass to the decoder per frame to decode. We receive it again
// in the decoder callback.
struct RTCFrameDecodeParams {
  RTCFrameDecodeParams(RTCVideoDecoderCallback cb, int64_t ts) : callback(cb), timestamp(ts) {}
  RTCVideoDecoderCallback callback;
  int64_t timestamp;
};

@interface TGRTCVideoDecoderH264 ()
- (void)setError:(OSStatus)error;
@end

// This is the callback function that VideoToolbox calls when decode is
// complete.
static void decompressionOutputCallback(void *decoderRef,
                                 void *params,
                                 OSStatus status,
                                 VTDecodeInfoFlags infoFlags,
                                 CVImageBufferRef imageBuffer,
                                 CMTime timestamp,
                                 CMTime duration) {
  std::unique_ptr<RTCFrameDecodeParams> decodeParams(
      reinterpret_cast<RTCFrameDecodeParams *>(params));
  if (status != noErr) {
    TGRTCVideoDecoderH264 *decoder = (__bridge TGRTCVideoDecoderH264 *)decoderRef;
    [decoder setError:status];
    RTC_LOG(LS_ERROR) << "Failed to decode frame. Status: " << status;
    return;
  }
  // TODO(tkchin): Handle CVO properly.
  RTCCVPixelBuffer *frameBuffer = [[RTCCVPixelBuffer alloc] initWithPixelBuffer:imageBuffer];
  RTCVideoFrame *decodedFrame =
      [[RTCVideoFrame alloc] initWithBuffer:frameBuffer
                                   rotation:RTCVideoRotation_0
                                timeStampNs:CMTimeGetSeconds(timestamp) * rtc::kNumNanosecsPerSec];
  decodedFrame.timeStamp = (int32_t)decodeParams->timestamp;
  decodeParams->callback(decodedFrame);
}

// Decoder.
@implementation TGRTCVideoDecoderH264 {
  CMVideoFormatDescriptionRef _videoFormat;
  CMMemoryPoolRef _memoryPool;
  VTDecompressionSessionRef _decompressionSession;
  RTCVideoDecoderCallback _callback;
  OSStatus _error;
}

- (instancetype)init {
  self = [super init];
  if (self) {
    _memoryPool = CMMemoryPoolCreate(nil);
  }
  return self;
}

- (void)dealloc {
  CMMemoryPoolInvalidate(_memoryPool);
  CFRelease(_memoryPool);
  [self destroyDecompressionSession];
  [self setVideoFormat:nullptr];
}

- (NSInteger)startDecodeWithNumberOfCores:(int)numberOfCores {
  return WEBRTC_VIDEO_CODEC_OK;
}

- (NSInteger)decode:(RTCEncodedImage *)inputImage
        missingFrames:(BOOL)missingFrames
    codecSpecificInfo:(nullable id<RTCCodecSpecificInfo>)info
         renderTimeMs:(int64_t)renderTimeMs {
  RTC_DCHECK(inputImage.buffer);

  if (_error != noErr) {
    RTC_LOG(LS_WARNING) << "Last frame decode failed.";
    _error = noErr;
    return WEBRTC_VIDEO_CODEC_ERROR;
  }

  rtc::ScopedCFTypeRef<CMVideoFormatDescriptionRef> inputFormat =
      rtc::ScopedCF(webrtc::CreateVideoFormatDescription((uint8_t *)inputImage.buffer.bytes,
                                                         inputImage.buffer.length));
  if (inputFormat) {
    // Check if the video format has changed, and reinitialize decoder if
    // needed.
    if (!CMFormatDescriptionEqual(inputFormat.get(), _videoFormat)) {
      [self setVideoFormat:inputFormat.get()];
      int resetDecompressionSessionError = [self resetDecompressionSession];
      if (resetDecompressionSessionError != WEBRTC_VIDEO_CODEC_OK) {
        return resetDecompressionSessionError;
      }
    }
  }
  if (!_videoFormat) {
    // We received a frame but we don't have format information so we can't
    // decode it.
    // This can happen after backgrounding. We need to wait for the next
    // sps/pps before we can resume so we request a keyframe by returning an
    // error.
    RTC_LOG(LS_WARNING) << "Missing video format. Frame with sps/pps required.";
    return WEBRTC_VIDEO_CODEC_ERROR;
  }
  CMSampleBufferRef sampleBuffer = nullptr;
  if (!webrtc::H264AnnexBBufferToCMSampleBuffer((uint8_t *)inputImage.buffer.bytes,
                                                inputImage.buffer.length,
                                                _videoFormat,
                                                &sampleBuffer,
                                                _memoryPool)) {
    return WEBRTC_VIDEO_CODEC_ERROR;
  }
  RTC_DCHECK(sampleBuffer);
  VTDecodeFrameFlags decodeFlags = kVTDecodeFrame_EnableAsynchronousDecompression;
  std::unique_ptr<RTCFrameDecodeParams> frameDecodeParams;
  frameDecodeParams.reset(new RTCFrameDecodeParams(_callback, inputImage.timeStamp));
  OSStatus status = VTDecompressionSessionDecodeFrame(
      _decompressionSession, sampleBuffer, decodeFlags, frameDecodeParams.release(), nullptr);
#if defined(WEBRTC_IOS)
  // Re-initialize the decoder if we have an invalid session while the app is
  // active or decoder malfunctions and retry the decode request.
  if ((status == kVTInvalidSessionErr || status == kVTVideoDecoderMalfunctionErr) &&
      [self resetDecompressionSession] == WEBRTC_VIDEO_CODEC_OK) {
    RTC_LOG(LS_INFO) << "Failed to decode frame with code: " << status
                     << " retrying decode after decompression session reset";
    frameDecodeParams.reset(new RTCFrameDecodeParams(_callback, inputImage.timeStamp));
    status = VTDecompressionSessionDecodeFrame(
        _decompressionSession, sampleBuffer, decodeFlags, frameDecodeParams.release(), nullptr);
  }
#endif
  CFRelease(sampleBuffer);
  if (status != noErr) {
    RTC_LOG(LS_ERROR) << "Failed to decode frame with code: " << status;
    return WEBRTC_VIDEO_CODEC_ERROR;
  }
  return WEBRTC_VIDEO_CODEC_OK;
}

- (void)setCallback:(RTCVideoDecoderCallback)callback {
  _callback = callback;
}

- (void)setError:(OSStatus)error {
  _error = error;
}

- (NSInteger)releaseDecoder {
  // Need to invalidate the session so that callbacks no longer occur and it
  // is safe to null out the callback.
  [self destroyDecompressionSession];
  [self setVideoFormat:nullptr];
  _callback = nullptr;
  return WEBRTC_VIDEO_CODEC_OK;
}

#pragma mark - Private

- (int)resetDecompressionSession {
  [self destroyDecompressionSession];

  // Need to wait for the first SPS to initialize decoder.
  if (!_videoFormat) {
    return WEBRTC_VIDEO_CODEC_OK;
  }

  // Set keys for OpenGL and IOSurface compatibilty, which makes the encoder
  // create pixel buffers with GPU backed memory. The intent here is to pass
  // the pixel buffers directly so we avoid a texture upload later during
  // rendering. This currently is moot because we are converting back to an
  // I420 frame after decode, but eventually we will be able to plumb
  // CVPixelBuffers directly to the renderer.
  // TODO(tkchin): Maybe only set OpenGL/IOSurface keys if we know that that
  // we can pass CVPixelBuffers as native handles in decoder output.
  static size_t const attributesSize = 3;
  CFTypeRef keys[attributesSize] = {
#if defined(WEBRTC_IOS)
    kCVPixelBufferOpenGLESCompatibilityKey,
#elif defined(WEBRTC_MAC)
    kCVPixelBufferOpenGLCompatibilityKey,
#endif
    kCVPixelBufferIOSurfacePropertiesKey,
    kCVPixelBufferPixelFormatTypeKey
  };
  CFDictionaryRef ioSurfaceValue = CreateCFTypeDictionary(nullptr, nullptr, 0);
  int64_t nv12type = kCVPixelFormatType_420YpCbCr8BiPlanarFullRange;
  CFNumberRef pixelFormat = CFNumberCreate(nullptr, kCFNumberLongType, &nv12type);
  CFTypeRef values[attributesSize] = {kCFBooleanTrue, ioSurfaceValue, pixelFormat};
  CFDictionaryRef attributes = CreateCFTypeDictionary(keys, values, attributesSize);
  if (ioSurfaceValue) {
    CFRelease(ioSurfaceValue);
    ioSurfaceValue = nullptr;
  }
  if (pixelFormat) {
    CFRelease(pixelFormat);
    pixelFormat = nullptr;
  }
  VTDecompressionOutputCallbackRecord record = {
      decompressionOutputCallback, (__bridge void *)self,
  };
  OSStatus status = VTDecompressionSessionCreate(
      nullptr, _videoFormat, nullptr, attributes, &record, &_decompressionSession);
  CFRelease(attributes);
  if (status != noErr) {
    RTC_LOG(LS_ERROR) << "Failed to create decompression session: " << status;
    [self destroyDecompressionSession];
    return WEBRTC_VIDEO_CODEC_ERROR;
  }
  [self configureDecompressionSession];

  return WEBRTC_VIDEO_CODEC_OK;
}

- (void)configureDecompressionSession {
  RTC_DCHECK(_decompressionSession);
#if defined(WEBRTC_IOS)
  VTSessionSetProperty(_decompressionSession, kVTDecompressionPropertyKey_RealTime, kCFBooleanTrue);
#endif
}

- (void)destroyDecompressionSession {
  if (_decompressionSession) {
#if defined(WEBRTC_IOS)
    if ([UIDevice isIOS11OrLater]) {
      VTDecompressionSessionWaitForAsynchronousFrames(_decompressionSession);
    }
#endif
    VTDecompressionSessionInvalidate(_decompressionSession);
    CFRelease(_decompressionSession);
    _decompressionSession = nullptr;
  }
}

- (void)setVideoFormat:(CMVideoFormatDescriptionRef)videoFormat {
  if (_videoFormat == videoFormat) {
    return;
  }
  if (_videoFormat) {
    CFRelease(_videoFormat);
  }
  _videoFormat = videoFormat;
  if (_videoFormat) {
    CFRetain(_videoFormat);
  }
}

- (NSString *)implementationName {
  return @"VideoToolbox";
}

@end
Update to 7.0.0 (2060) 2020-08-14 16:58:22 +00:00			`/*`
			`* Copyright (c) 2015 The WebRTC project authors. All Rights Reserved.`
			`*`
			`* Use of this source code is governed by a BSD-style license`
			`* that can be found in the LICENSE file in the root of the source`
			`* tree. An additional intellectual property rights grant can be found`
			`* in the file PATENTS. All contributing project authors may`
			`* be found in the AUTHORS file in the root of the source tree.`
			`*`
			`*/`

			`#import "TGRTCVideoDecoderH264.h"`

			`#import <VideoToolbox/VideoToolbox.h>`

			`#import "base/RTCVideoFrame.h"`
			`#import "base/RTCVideoFrameBuffer.h"`
			`#import "components/video_frame_buffer/RTCCVPixelBuffer.h"`
			`#import "helpers.h"`
			`#import "helpers/scoped_cftyperef.h"`

			`#if defined(WEBRTC_IOS)`
			`#import "helpers/UIDevice+RTCDevice.h"`
			`#endif`

			`#include "modules/video_coding/include/video_error_codes.h"`
			`#include "rtc_base/checks.h"`
			`#include "rtc_base/logging.h"`
			`#include "rtc_base/time_utils.h"`
			`#include "sdk/objc/components/video_codec/nalu_rewriter.h"`

			`// Struct that we pass to the decoder per frame to decode. We receive it again`
			`// in the decoder callback.`
			`struct RTCFrameDecodeParams {`
			`RTCFrameDecodeParams(RTCVideoDecoderCallback cb, int64_t ts) : callback(cb), timestamp(ts) {}`
			`RTCVideoDecoderCallback callback;`
			`int64_t timestamp;`
			`};`

			`@interface TGRTCVideoDecoderH264 ()`
			`- (void)setError:(OSStatus)error;`
			`@end`

			`// This is the callback function that VideoToolbox calls when decode is`
			`// complete.`
			`static void decompressionOutputCallback(void *decoderRef,`
			`void *params,`
			`OSStatus status,`
			`VTDecodeInfoFlags infoFlags,`
			`CVImageBufferRef imageBuffer,`
			`CMTime timestamp,`
			`CMTime duration) {`
			`std::unique_ptr<RTCFrameDecodeParams> decodeParams(`
			`reinterpret_cast<RTCFrameDecodeParams *>(params));`
			`if (status != noErr) {`
			`TGRTCVideoDecoderH264 decoder = (__bridge TGRTCVideoDecoderH264 )decoderRef;`
			`[decoder setError:status];`
			`RTC_LOG(LS_ERROR) << "Failed to decode frame. Status: " << status;`
			`return;`
			`}`
			`// TODO(tkchin): Handle CVO properly.`
			`RTCCVPixelBuffer *frameBuffer = [[RTCCVPixelBuffer alloc] initWithPixelBuffer:imageBuffer];`
			`RTCVideoFrame *decodedFrame =`
			`[[RTCVideoFrame alloc] initWithBuffer:frameBuffer`
			`rotation:RTCVideoRotation_0`
			`timeStampNs:CMTimeGetSeconds(timestamp) * rtc::kNumNanosecsPerSec];`
			`decodedFrame.timeStamp = (int32_t)decodeParams->timestamp;`
			`decodeParams->callback(decodedFrame);`
			`}`

			`// Decoder.`
			`@implementation TGRTCVideoDecoderH264 {`
			`CMVideoFormatDescriptionRef _videoFormat;`
			`CMMemoryPoolRef _memoryPool;`
			`VTDecompressionSessionRef _decompressionSession;`
			`RTCVideoDecoderCallback _callback;`
			`OSStatus _error;`
			`}`

			`- (instancetype)init {`
			`self = [super init];`
			`if (self) {`
			`_memoryPool = CMMemoryPoolCreate(nil);`
			`}`
			`return self;`
			`}`

			`- (void)dealloc {`
			`CMMemoryPoolInvalidate(_memoryPool);`
			`CFRelease(_memoryPool);`
			`[self destroyDecompressionSession];`
			`[self setVideoFormat:nullptr];`
			`}`

			`- (NSInteger)startDecodeWithNumberOfCores:(int)numberOfCores {`
			`return WEBRTC_VIDEO_CODEC_OK;`
			`}`

			`- (NSInteger)decode:(RTCEncodedImage *)inputImage`
			`missingFrames:(BOOL)missingFrames`
			`codecSpecificInfo:(nullable id<RTCCodecSpecificInfo>)info`
			`renderTimeMs:(int64_t)renderTimeMs {`
			`RTC_DCHECK(inputImage.buffer);`

			`if (_error != noErr) {`
			`RTC_LOG(LS_WARNING) << "Last frame decode failed.";`
			`_error = noErr;`
			`return WEBRTC_VIDEO_CODEC_ERROR;`
			`}`

			`rtc::ScopedCFTypeRef<CMVideoFormatDescriptionRef> inputFormat =`
			`rtc::ScopedCF(webrtc::CreateVideoFormatDescription((uint8_t *)inputImage.buffer.bytes,`
			`inputImage.buffer.length));`
			`if (inputFormat) {`
			`// Check if the video format has changed, and reinitialize decoder if`
			`// needed.`
			`if (!CMFormatDescriptionEqual(inputFormat.get(), _videoFormat)) {`
			`[self setVideoFormat:inputFormat.get()];`
			`int resetDecompressionSessionError = [self resetDecompressionSession];`
			`if (resetDecompressionSessionError != WEBRTC_VIDEO_CODEC_OK) {`
			`return resetDecompressionSessionError;`
			`}`
			`}`
			`}`
			`if (!_videoFormat) {`
			`// We received a frame but we don't have format information so we can't`
			`// decode it.`
			`// This can happen after backgrounding. We need to wait for the next`
			`// sps/pps before we can resume so we request a keyframe by returning an`
			`// error.`
			`RTC_LOG(LS_WARNING) << "Missing video format. Frame with sps/pps required.";`
			`return WEBRTC_VIDEO_CODEC_ERROR;`
			`}`
			`CMSampleBufferRef sampleBuffer = nullptr;`
			`if (!webrtc::H264AnnexBBufferToCMSampleBuffer((uint8_t *)inputImage.buffer.bytes,`
			`inputImage.buffer.length,`
			`_videoFormat,`
			`&sampleBuffer,`
			`_memoryPool)) {`
			`return WEBRTC_VIDEO_CODEC_ERROR;`
			`}`
			`RTC_DCHECK(sampleBuffer);`
			`VTDecodeFrameFlags decodeFlags = kVTDecodeFrame_EnableAsynchronousDecompression;`
			`std::unique_ptr<RTCFrameDecodeParams> frameDecodeParams;`
			`frameDecodeParams.reset(new RTCFrameDecodeParams(_callback, inputImage.timeStamp));`
			`OSStatus status = VTDecompressionSessionDecodeFrame(`
			`_decompressionSession, sampleBuffer, decodeFlags, frameDecodeParams.release(), nullptr);`
			`#if defined(WEBRTC_IOS)`
			`// Re-initialize the decoder if we have an invalid session while the app is`
			`// active or decoder malfunctions and retry the decode request.`
			`if ((status == kVTInvalidSessionErr \|\| status == kVTVideoDecoderMalfunctionErr) &&`
			`[self resetDecompressionSession] == WEBRTC_VIDEO_CODEC_OK) {`
			`RTC_LOG(LS_INFO) << "Failed to decode frame with code: " << status`
			`<< " retrying decode after decompression session reset";`
			`frameDecodeParams.reset(new RTCFrameDecodeParams(_callback, inputImage.timeStamp));`
			`status = VTDecompressionSessionDecodeFrame(`
			`_decompressionSession, sampleBuffer, decodeFlags, frameDecodeParams.release(), nullptr);`
			`}`
			`#endif`
			`CFRelease(sampleBuffer);`
			`if (status != noErr) {`
			`RTC_LOG(LS_ERROR) << "Failed to decode frame with code: " << status;`
			`return WEBRTC_VIDEO_CODEC_ERROR;`
			`}`
			`return WEBRTC_VIDEO_CODEC_OK;`
			`}`

			`- (void)setCallback:(RTCVideoDecoderCallback)callback {`
			`_callback = callback;`
			`}`

			`- (void)setError:(OSStatus)error {`
			`_error = error;`
			`}`

			`- (NSInteger)releaseDecoder {`
			`// Need to invalidate the session so that callbacks no longer occur and it`
			`// is safe to null out the callback.`
			`[self destroyDecompressionSession];`
			`[self setVideoFormat:nullptr];`
			`_callback = nullptr;`
			`return WEBRTC_VIDEO_CODEC_OK;`
			`}`

			`#pragma mark - Private`

			`- (int)resetDecompressionSession {`
			`[self destroyDecompressionSession];`

			`// Need to wait for the first SPS to initialize decoder.`
			`if (!_videoFormat) {`
			`return WEBRTC_VIDEO_CODEC_OK;`
			`}`

			`// Set keys for OpenGL and IOSurface compatibilty, which makes the encoder`
			`// create pixel buffers with GPU backed memory. The intent here is to pass`
			`// the pixel buffers directly so we avoid a texture upload later during`
			`// rendering. This currently is moot because we are converting back to an`
			`// I420 frame after decode, but eventually we will be able to plumb`
			`// CVPixelBuffers directly to the renderer.`
			`// TODO(tkchin): Maybe only set OpenGL/IOSurface keys if we know that that`
			`// we can pass CVPixelBuffers as native handles in decoder output.`
			`static size_t const attributesSize = 3;`
			`CFTypeRef keys[attributesSize] = {`
			`#if defined(WEBRTC_IOS)`
			`kCVPixelBufferOpenGLESCompatibilityKey,`
			`#elif defined(WEBRTC_MAC)`
			`kCVPixelBufferOpenGLCompatibilityKey,`
			`#endif`
			`kCVPixelBufferIOSurfacePropertiesKey,`
			`kCVPixelBufferPixelFormatTypeKey`
			`};`
			`CFDictionaryRef ioSurfaceValue = CreateCFTypeDictionary(nullptr, nullptr, 0);`
			`int64_t nv12type = kCVPixelFormatType_420YpCbCr8BiPlanarFullRange;`
			`CFNumberRef pixelFormat = CFNumberCreate(nullptr, kCFNumberLongType, &nv12type);`
			`CFTypeRef values[attributesSize] = {kCFBooleanTrue, ioSurfaceValue, pixelFormat};`
			`CFDictionaryRef attributes = CreateCFTypeDictionary(keys, values, attributesSize);`
			`if (ioSurfaceValue) {`
			`CFRelease(ioSurfaceValue);`
			`ioSurfaceValue = nullptr;`
			`}`
			`if (pixelFormat) {`
			`CFRelease(pixelFormat);`
			`pixelFormat = nullptr;`
			`}`
			`VTDecompressionOutputCallbackRecord record = {`
			`decompressionOutputCallback, (__bridge void *)self,`
			`};`
			`OSStatus status = VTDecompressionSessionCreate(`
			`nullptr, _videoFormat, nullptr, attributes, &record, &_decompressionSession);`
			`CFRelease(attributes);`
			`if (status != noErr) {`
			`RTC_LOG(LS_ERROR) << "Failed to create decompression session: " << status;`
			`[self destroyDecompressionSession];`
			`return WEBRTC_VIDEO_CODEC_ERROR;`
			`}`
			`[self configureDecompressionSession];`

			`return WEBRTC_VIDEO_CODEC_OK;`
			`}`

			`- (void)configureDecompressionSession {`
			`RTC_DCHECK(_decompressionSession);`
			`#if defined(WEBRTC_IOS)`
			`VTSessionSetProperty(_decompressionSession, kVTDecompressionPropertyKey_RealTime, kCFBooleanTrue);`
			`#endif`
			`}`

			`- (void)destroyDecompressionSession {`
			`if (_decompressionSession) {`
			`#if defined(WEBRTC_IOS)`
			`if ([UIDevice isIOS11OrLater]) {`
			`VTDecompressionSessionWaitForAsynchronousFrames(_decompressionSession);`
			`}`
			`#endif`
			`VTDecompressionSessionInvalidate(_decompressionSession);`
			`CFRelease(_decompressionSession);`
			`_decompressionSession = nullptr;`
			`}`
			`}`

			`- (void)setVideoFormat:(CMVideoFormatDescriptionRef)videoFormat {`
			`if (_videoFormat == videoFormat) {`
			`return;`
			`}`
			`if (_videoFormat) {`
			`CFRelease(_videoFormat);`
			`}`
			`_videoFormat = videoFormat;`
			`if (_videoFormat) {`
			`CFRetain(_videoFormat);`
			`}`
			`}`

			`- (NSString *)implementationName {`
			`return @"VideoToolbox";`
			`}`

			`@end`