/* * Copyright (c) 2014 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #include "media/engine/simulcast.h" #include #include #include #include #include "absl/types/optional.h" #include "api/video/video_codec_constants.h" #include "media/base/media_constants.h" #include "modules/video_coding/utility/simulcast_rate_allocator.h" #include "rtc_base/arraysize.h" #include "rtc_base/checks.h" #include "rtc_base/experiments/min_video_bitrate_experiment.h" #include "rtc_base/experiments/normalize_simulcast_size_experiment.h" #include "rtc_base/experiments/rate_control_settings.h" #include "rtc_base/logging.h" #include "system_wrappers/include/field_trial.h" namespace cricket { namespace { constexpr webrtc::DataRate Interpolate(const webrtc::DataRate& a, const webrtc::DataRate& b, float rate) { return a * (1.0 - rate) + b * rate; } constexpr char kUseLegacySimulcastLayerLimitFieldTrial[] = "WebRTC-LegacySimulcastLayerLimit"; // Limits for legacy conference screensharing mode. Currently used for the // lower of the two simulcast streams. constexpr webrtc::DataRate kScreenshareDefaultTl0Bitrate = webrtc::DataRate::KilobitsPerSec(200); constexpr webrtc::DataRate kScreenshareDefaultTl1Bitrate = webrtc::DataRate::KilobitsPerSec(1000); // Min/max bitrate for the higher one of the two simulcast stream used for // screen content. constexpr webrtc::DataRate kScreenshareHighStreamMinBitrate = webrtc::DataRate::KilobitsPerSec(600); constexpr webrtc::DataRate kScreenshareHighStreamMaxBitrate = webrtc::DataRate::KilobitsPerSec(1250); } // namespace struct SimulcastFormat { int width; int height; // The maximum number of simulcast layers can be used for // resolutions at |widthxheigh| for legacy applications. size_t max_layers; // The maximum bitrate for encoding stream at |widthxheight|, when we are // not sending the next higher spatial stream. webrtc::DataRate max_bitrate; // The target bitrate for encoding stream at |widthxheight|, when this layer // is not the highest layer (i.e., when we are sending another higher spatial // stream). webrtc::DataRate target_bitrate; // The minimum bitrate needed for encoding stream at |widthxheight|. webrtc::DataRate min_bitrate; }; // These tables describe from which resolution we can use how many // simulcast layers at what bitrates (maximum, target, and minimum). // Important!! Keep this table from high resolution to low resolution. constexpr const SimulcastFormat kSimulcastFormats[] = { {1920, 1080, 3, webrtc::DataRate::KilobitsPerSec(5000), webrtc::DataRate::KilobitsPerSec(4000), webrtc::DataRate::KilobitsPerSec(800)}, {1280, 720, 3, webrtc::DataRate::KilobitsPerSec(2500), webrtc::DataRate::KilobitsPerSec(2500), webrtc::DataRate::KilobitsPerSec(600)}, {960, 540, 3, webrtc::DataRate::KilobitsPerSec(1200), webrtc::DataRate::KilobitsPerSec(1200), webrtc::DataRate::KilobitsPerSec(350)}, {640, 360, 2, webrtc::DataRate::KilobitsPerSec(700), webrtc::DataRate::KilobitsPerSec(500), webrtc::DataRate::KilobitsPerSec(150)}, {480, 270, 2, webrtc::DataRate::KilobitsPerSec(450), webrtc::DataRate::KilobitsPerSec(350), webrtc::DataRate::KilobitsPerSec(150)}, {320, 180, 1, webrtc::DataRate::KilobitsPerSec(200), webrtc::DataRate::KilobitsPerSec(150), webrtc::DataRate::KilobitsPerSec(30)}, {0, 0, 1, webrtc::DataRate::KilobitsPerSec(200), webrtc::DataRate::KilobitsPerSec(150), webrtc::DataRate::KilobitsPerSec(30)}}; const int kMaxScreenshareSimulcastLayers = 2; // Multiway: Number of temporal layers for each simulcast stream. int DefaultNumberOfTemporalLayers(int simulcast_id, bool screenshare) { RTC_CHECK_GE(simulcast_id, 0); RTC_CHECK_LT(simulcast_id, webrtc::kMaxSimulcastStreams); const int kDefaultNumTemporalLayers = 3; const int kDefaultNumScreenshareTemporalLayers = 2; int default_num_temporal_layers = screenshare ? kDefaultNumScreenshareTemporalLayers : kDefaultNumTemporalLayers; const std::string group_name = screenshare ? webrtc::field_trial::FindFullName( "WebRTC-VP8ScreenshareTemporalLayers") : webrtc::field_trial::FindFullName( "WebRTC-VP8ConferenceTemporalLayers"); if (group_name.empty()) return default_num_temporal_layers; int num_temporal_layers = default_num_temporal_layers; if (sscanf(group_name.c_str(), "%d", &num_temporal_layers) == 1 && num_temporal_layers > 0 && num_temporal_layers <= webrtc::kMaxTemporalStreams) { return num_temporal_layers; } RTC_LOG(LS_WARNING) << "Attempt to set number of temporal layers to " "incorrect value: " << group_name; return default_num_temporal_layers; } int FindSimulcastFormatIndex(int width, int height) { RTC_DCHECK_GE(width, 0); RTC_DCHECK_GE(height, 0); for (uint32_t i = 0; i < arraysize(kSimulcastFormats); ++i) { if (width * height >= kSimulcastFormats[i].width * kSimulcastFormats[i].height) { return i; } } RTC_NOTREACHED(); return -1; } // Round size to nearest simulcast-friendly size. // Simulcast stream width and height must both be dividable by // |2 ^ (simulcast_layers - 1)|. int NormalizeSimulcastSize(int size, size_t simulcast_layers) { int base2_exponent = static_cast(simulcast_layers) - 1; const absl::optional experimental_base2_exponent = webrtc::NormalizeSimulcastSizeExperiment::GetBase2Exponent(); if (experimental_base2_exponent && (size > (1 << *experimental_base2_exponent))) { base2_exponent = *experimental_base2_exponent; } return ((size >> base2_exponent) << base2_exponent); } SimulcastFormat InterpolateSimulcastFormat(int width, int height) { const int index = FindSimulcastFormatIndex(width, height); if (index == 0) return kSimulcastFormats[index]; const int total_pixels_up = kSimulcastFormats[index - 1].width * kSimulcastFormats[index - 1].height; const int total_pixels_down = kSimulcastFormats[index].width * kSimulcastFormats[index].height; const int total_pixels = width * height; const float rate = (total_pixels_up - total_pixels) / static_cast(total_pixels_up - total_pixels_down); size_t max_layers = kSimulcastFormats[index].max_layers; webrtc::DataRate max_bitrate = Interpolate(kSimulcastFormats[index - 1].max_bitrate, kSimulcastFormats[index].max_bitrate, rate); webrtc::DataRate target_bitrate = Interpolate(kSimulcastFormats[index - 1].target_bitrate, kSimulcastFormats[index].target_bitrate, rate); webrtc::DataRate min_bitrate = Interpolate(kSimulcastFormats[index - 1].min_bitrate, kSimulcastFormats[index].min_bitrate, rate); return {width, height, max_layers, max_bitrate, target_bitrate, min_bitrate}; } webrtc::DataRate FindSimulcastMaxBitrate(int width, int height) { return InterpolateSimulcastFormat(width, height).max_bitrate; } webrtc::DataRate FindSimulcastTargetBitrate(int width, int height) { return InterpolateSimulcastFormat(width, height).target_bitrate; } webrtc::DataRate FindSimulcastMinBitrate(int width, int height) { return InterpolateSimulcastFormat(width, height).min_bitrate; } void BoostMaxSimulcastLayer(webrtc::DataRate max_bitrate, std::vector* layers) { if (layers->empty()) return; const webrtc::DataRate total_bitrate = GetTotalMaxBitrate(*layers); // We're still not using all available bits. if (total_bitrate < max_bitrate) { // Spend additional bits to boost the max layer. const webrtc::DataRate bitrate_left = max_bitrate - total_bitrate; layers->back().max_bitrate_bps += bitrate_left.bps(); } } webrtc::DataRate GetTotalMaxBitrate( const std::vector& layers) { if (layers.empty()) return webrtc::DataRate::Zero(); int total_max_bitrate_bps = 0; for (size_t s = 0; s < layers.size() - 1; ++s) { total_max_bitrate_bps += layers[s].target_bitrate_bps; } total_max_bitrate_bps += layers.back().max_bitrate_bps; return webrtc::DataRate::BitsPerSec(total_max_bitrate_bps); } size_t LimitSimulcastLayerCount(int width, int height, size_t need_layers, size_t layer_count) { if (!webrtc::field_trial::IsDisabled( kUseLegacySimulcastLayerLimitFieldTrial)) { size_t adaptive_layer_count = std::max( need_layers, kSimulcastFormats[FindSimulcastFormatIndex(width, height)].max_layers); if (layer_count > adaptive_layer_count) { RTC_LOG(LS_WARNING) << "Reducing simulcast layer count from " << layer_count << " to " << adaptive_layer_count; layer_count = adaptive_layer_count; } } return layer_count; } std::vector GetSimulcastConfig( size_t min_layers, size_t max_layers, int width, int height, double bitrate_priority, int max_qp, bool is_screenshare_with_conference_mode, bool temporal_layers_supported) { RTC_DCHECK_LE(min_layers, max_layers); RTC_DCHECK(max_layers > 1 || is_screenshare_with_conference_mode); const bool base_heavy_tl3_rate_alloc = webrtc::RateControlSettings::ParseFromFieldTrials() .Vp8BaseHeavyTl3RateAllocation(); if (is_screenshare_with_conference_mode) { return GetScreenshareLayers(max_layers, width, height, bitrate_priority, max_qp, temporal_layers_supported, base_heavy_tl3_rate_alloc); } else { // Some applications rely on the old behavior limiting the simulcast layer // count based on the resolution automatically, which they can get through // the WebRTC-LegacySimulcastLayerLimit field trial until they update. max_layers = LimitSimulcastLayerCount(width, height, min_layers, max_layers); return GetNormalSimulcastLayers(max_layers, width, height, bitrate_priority, max_qp, temporal_layers_supported, base_heavy_tl3_rate_alloc); } } std::vector GetNormalSimulcastLayers( size_t layer_count, int width, int height, double bitrate_priority, int max_qp, bool temporal_layers_supported, bool base_heavy_tl3_rate_alloc) { std::vector layers(layer_count); // Format width and height has to be divisible by |2 ^ num_simulcast_layers - // 1|. width = NormalizeSimulcastSize(width, layer_count); height = NormalizeSimulcastSize(height, layer_count); // Add simulcast streams, from highest resolution (|s| = num_simulcast_layers // -1) to lowest resolution at |s| = 0. for (size_t s = layer_count - 1;; --s) { layers[s].width = width; layers[s].height = height; // TODO(pbos): Fill actual temporal-layer bitrate thresholds. layers[s].max_qp = max_qp; layers[s].num_temporal_layers = temporal_layers_supported ? DefaultNumberOfTemporalLayers(s, false) : 1; layers[s].max_bitrate_bps = FindSimulcastMaxBitrate(width, height).bps(); layers[s].target_bitrate_bps = FindSimulcastTargetBitrate(width, height).bps(); int num_temporal_layers = DefaultNumberOfTemporalLayers(s, false); if (s == 0) { // If alternative temporal rate allocation is selected, adjust the // bitrate of the lowest simulcast stream so that absolute bitrate for // the base temporal layer matches the bitrate for the base temporal // layer with the default 3 simulcast streams. Otherwise we risk a // higher threshold for receiving a feed at all. float rate_factor = 1.0; if (num_temporal_layers == 3) { if (base_heavy_tl3_rate_alloc) { // Base heavy allocation increases TL0 bitrate from 40% to 60%. rate_factor = 0.4 / 0.6; } } else { rate_factor = webrtc::SimulcastRateAllocator::GetTemporalRateAllocation( 3, 0, /*base_heavy_tl3_rate_alloc=*/false) / webrtc::SimulcastRateAllocator::GetTemporalRateAllocation( num_temporal_layers, 0, /*base_heavy_tl3_rate_alloc=*/false); } layers[s].max_bitrate_bps = static_cast(layers[s].max_bitrate_bps * rate_factor); layers[s].target_bitrate_bps = static_cast(layers[s].target_bitrate_bps * rate_factor); } layers[s].min_bitrate_bps = FindSimulcastMinBitrate(width, height).bps(); layers[s].max_framerate = kDefaultVideoMaxFramerate; width /= 2; height /= 2; if (s == 0) { break; } } // Currently the relative bitrate priority of the sender is controlled by // the value of the lowest VideoStream. // TODO(bugs.webrtc.org/8630): The web specification describes being able to // control relative bitrate for each individual simulcast layer, but this // is currently just implemented per rtp sender. layers[0].bitrate_priority = bitrate_priority; return layers; } std::vector GetScreenshareLayers( size_t max_layers, int width, int height, double bitrate_priority, int max_qp, bool temporal_layers_supported, bool base_heavy_tl3_rate_alloc) { auto max_screenshare_layers = kMaxScreenshareSimulcastLayers; size_t num_simulcast_layers = std::min(max_layers, max_screenshare_layers); std::vector layers(num_simulcast_layers); // For legacy screenshare in conference mode, tl0 and tl1 bitrates are // piggybacked on the VideoCodec struct as target and max bitrates, // respectively. See eg. webrtc::LibvpxVp8Encoder::SetRates(). layers[0].width = width; layers[0].height = height; layers[0].max_qp = max_qp; layers[0].max_framerate = 5; layers[0].min_bitrate_bps = webrtc::kDefaultMinVideoBitrateBps; layers[0].target_bitrate_bps = kScreenshareDefaultTl0Bitrate.bps(); layers[0].max_bitrate_bps = kScreenshareDefaultTl1Bitrate.bps(); layers[0].num_temporal_layers = temporal_layers_supported ? 2 : 1; // With simulcast enabled, add another spatial layer. This one will have a // more normal layout, with the regular 3 temporal layer pattern and no fps // restrictions. The base simulcast layer will still use legacy setup. if (num_simulcast_layers == kMaxScreenshareSimulcastLayers) { // Add optional upper simulcast layer. const int num_temporal_layers = DefaultNumberOfTemporalLayers(1, true); int max_bitrate_bps; bool using_boosted_bitrate = false; if (!temporal_layers_supported) { // Set the max bitrate to where the base layer would have been if temporal // layers were enabled. max_bitrate_bps = static_cast( kScreenshareHighStreamMaxBitrate.bps() * webrtc::SimulcastRateAllocator::GetTemporalRateAllocation( num_temporal_layers, 0, base_heavy_tl3_rate_alloc)); } else if (DefaultNumberOfTemporalLayers(1, true) != 3 || base_heavy_tl3_rate_alloc) { // Experimental temporal layer mode used, use increased max bitrate. max_bitrate_bps = kScreenshareHighStreamMaxBitrate.bps(); using_boosted_bitrate = true; } else { // Keep current bitrates with default 3tl/8 frame settings. // Lowest temporal layers of a 3 layer setup will have 40% of the total // bitrate allocation for that simulcast layer. Make sure the gap between // the target of the lower simulcast layer and first temporal layer of the // higher one is at most 2x the bitrate, so that upswitching is not // hampered by stalled bitrate estimates. max_bitrate_bps = 2 * ((layers[0].target_bitrate_bps * 10) / 4); } layers[1].width = width; layers[1].height = height; layers[1].max_qp = max_qp; layers[1].max_framerate = kDefaultVideoMaxFramerate; layers[1].num_temporal_layers = temporal_layers_supported ? DefaultNumberOfTemporalLayers(1, true) : 1; layers[1].min_bitrate_bps = using_boosted_bitrate ? kScreenshareHighStreamMinBitrate.bps() : layers[0].target_bitrate_bps * 2; // Cap max bitrate so it isn't overly high for the given resolution. int resolution_limited_bitrate = std::max(FindSimulcastMaxBitrate(width, height).bps(), layers[1].min_bitrate_bps); max_bitrate_bps = std::min(max_bitrate_bps, resolution_limited_bitrate); layers[1].target_bitrate_bps = max_bitrate_bps; layers[1].max_bitrate_bps = max_bitrate_bps; } // The bitrate priority currently implemented on a per-sender level, so we // just set it for the first simulcast layer. layers[0].bitrate_priority = bitrate_priority; return layers; } } // namespace cricket