Commit 1cb99158 authored by miu, committed by Commit bot

New FRAME_DURATION VideoFrameMetadata, with Cast Streaming use case.

Adds a new FRAME_DURATION option to VideoFrameMetadata, which can be
used by consumers of video frames to improve performance (e.g., encoding
quality).

This change also adds population of the new metadata by the desktop/tab
capture pipeline, and consumption by Cast Streaming's software VP8
encoder.  Having accurate frame duration information improves the
encoder's ability to choose a compression quality level that better
meets the target encode bitrate.

Later changes will require this in order to compute resource utilization
feedback signals (see bug for details).
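
As an illustration of the consumer-side pattern this change enables, here is a
minimal sketch (GetFrameDurationOrFallback is a hypothetical helper, not part
of this change; the real consumer is Cast Streaming's Vp8Encoder, below):

base::TimeDelta GetFrameDurationOrFallback(
    const scoped_refptr<media::VideoFrame>& frame,
    base::TimeDelta fallback) {
  base::TimeDelta duration;
  if (frame->metadata()->GetTimeDelta(
          media::VideoFrameMetadata::FRAME_DURATION, &duration) &&
      duration > base::TimeDelta()) {
    return duration;  // The producer supplied a per-frame estimate.
  }
  // No (or invalid) FRAME_DURATION metadata; fall back to a coarser
  // estimate, e.g. one derived from FRAME_RATE or inter-frame deltas.
  return fallback;
}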

BUG=156767

Review URL: https://codereview.chromium.org/1146723002

Cr-Commit-Position: refs/heads/master@{#330661}
parent 324a1696
@@ -135,7 +135,8 @@ bool ThreadSafeCaptureOracle::ObserveEventAndDecideCapture(
           this,
           frame_number,
           base::Passed(&output_buffer),
-          capture_begin_time);
+          capture_begin_time,
+          oracle_.estimated_frame_duration());
   return true;
 }
@@ -167,6 +168,7 @@ void ThreadSafeCaptureOracle::DidCaptureFrame(
     int frame_number,
     scoped_ptr<media::VideoCaptureDevice::Client::Buffer> buffer,
     base::TimeTicks capture_begin_time,
+    base::TimeDelta estimated_frame_duration,
     const scoped_refptr<media::VideoFrame>& frame,
     base::TimeTicks timestamp,
     bool success) {
@@ -180,13 +182,14 @@ void ThreadSafeCaptureOracle::DidCaptureFrame(
   if (success) {
     if (oracle_.CompleteCapture(frame_number, &timestamp)) {
-      // TODO(miu): Use the locked-in frame rate from AnimatedContentSampler.
       frame->metadata()->SetDouble(media::VideoFrameMetadata::FRAME_RATE,
                                    params_.requested_format.frame_rate);
       frame->metadata()->SetTimeTicks(
           media::VideoFrameMetadata::CAPTURE_BEGIN_TIME, capture_begin_time);
       frame->metadata()->SetTimeTicks(
           media::VideoFrameMetadata::CAPTURE_END_TIME, base::TimeTicks::Now());
+      frame->metadata()->SetTimeDelta(media::VideoFrameMetadata::FRAME_DURATION,
+                                      estimated_frame_duration);
       client_->OnIncomingCapturedVideoFrame(buffer.Pass(), frame, timestamp);
     }
   }
...
@@ -80,6 +80,7 @@ class ThreadSafeCaptureOracle
       int frame_number,
       scoped_ptr<media::VideoCaptureDevice::Client::Buffer> buffer,
       base::TimeTicks capture_begin_time,
+      base::TimeDelta estimated_frame_duration,
       const scoped_refptr<media::VideoFrame>& frame,
       base::TimeTicks timestamp,
       bool success);
...
@@ -60,20 +60,27 @@ bool VideoCaptureOracle::ObserveEventAndDecideCapture(
   last_event_time_[event] = event_time;

   bool should_sample;
+  duration_of_next_frame_ = base::TimeDelta();
   switch (event) {
     case kCompositorUpdate:
       smoothing_sampler_.ConsiderPresentationEvent(event_time);
       content_sampler_.ConsiderPresentationEvent(damage_rect, event_time);
       if (content_sampler_.HasProposal()) {
         should_sample = content_sampler_.ShouldSample();
-        if (should_sample)
+        if (should_sample) {
           event_time = content_sampler_.frame_timestamp();
+          duration_of_next_frame_ = content_sampler_.sampling_period();
+        }
       } else {
         should_sample = smoothing_sampler_.ShouldSample();
+        if (should_sample)
+          duration_of_next_frame_ = smoothing_sampler_.min_capture_period();
       }
       break;
     default:
       should_sample = smoothing_sampler_.IsOverdueForSamplingAt(event_time);
+      if (should_sample)
+        duration_of_next_frame_ = smoothing_sampler_.min_capture_period();
       break;
   }
...
@@ -51,6 +51,13 @@ class CONTENT_EXPORT VideoCaptureOracle {
     return smoothing_sampler_.min_capture_period();
   }

+  // Returns the oracle's estimate of the duration of the next frame. This
+  // should be called just after ObserveEventAndDecideCapture(), and will only
+  // be non-zero if the call returned true.
+  base::TimeDelta estimated_frame_duration() const {
+    return duration_of_next_frame_;
+  }
+
  private:
   // Retrieve/Assign a frame timestamp by capture |frame_number|.
   base::TimeTicks GetFrameTimestamp(int frame_number) const;
@@ -63,6 +70,11 @@ class CONTENT_EXPORT VideoCaptureOracle {
   // sanity-check that event times are monotonically non-decreasing.
   base::TimeTicks last_event_time_[kNumEvents];

+  // Updated by the last call to ObserveEventAndDecideCapture() with the
+  // estimated duration of the next frame to sample. This is zero if the
+  // method returned false.
+  base::TimeDelta duration_of_next_frame_;
+
   // Stores the frame number from the last delivered frame.
   int last_delivered_frame_number_;
...
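
The accessor's contract implies a strict call order. A sketch of a hypothetical
caller (MaybeDecideCapture is illustrative only; the real caller is
ThreadSafeCaptureOracle above):

// Read estimated_frame_duration() immediately after a successful
// ObserveEventAndDecideCapture(); it is zero whenever that call returns false.
bool MaybeDecideCapture(content::VideoCaptureOracle* oracle,
                        content::VideoCaptureOracle::Event event,
                        const gfx::Rect& damage_rect,
                        base::TimeTicks event_time,
                        base::TimeDelta* duration_out) {
  if (!oracle->ObserveEventAndDecideCapture(event, damage_rect, event_time))
    return false;  // estimated_frame_duration() would be zero here.
  *duration_out = oracle->estimated_frame_duration();  // Non-zero by contract.
  return true;
}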
@@ -144,8 +144,11 @@ TEST(VideoCaptureOracleTest, TransitionsSmoothlyBetweenSamplers) {
         t);
     if (require_oracle_says_sample)
       ASSERT_TRUE(oracle_says_sample);
-    if (!oracle_says_sample)
+    if (!oracle_says_sample) {
+      ASSERT_EQ(base::TimeDelta(), oracle.estimated_frame_duration());
       continue;
+    }
+    ASSERT_LT(base::TimeDelta(), oracle.estimated_frame_duration());
     const int frame_number = oracle.RecordCapture();
...
@@ -47,14 +47,27 @@ void VideoFrameMetadata::SetString(Key key, const std::string& value) {
       base::BinaryValue::CreateWithCopiedBuffer(value.data(), value.size()));
 }

-void VideoFrameMetadata::SetTimeTicks(Key key, const base::TimeTicks& value) {
+namespace {
+
+template <class TimeType>
+void SetTimeValue(VideoFrameMetadata::Key key,
+                  const TimeType& value,
+                  base::DictionaryValue* dictionary) {
   const int64 internal_value = value.ToInternalValue();
-  dictionary_.SetWithoutPathExpansion(
+  dictionary->SetWithoutPathExpansion(
       ToInternalKey(key),
       base::BinaryValue::CreateWithCopiedBuffer(
           reinterpret_cast<const char*>(&internal_value),
           sizeof(internal_value)));
 }
+
+}  // namespace
+
+void VideoFrameMetadata::SetTimeDelta(Key key, const base::TimeDelta& value) {
+  SetTimeValue(key, value, &dictionary_);
+}
+
+void VideoFrameMetadata::SetTimeTicks(Key key, const base::TimeTicks& value) {
+  SetTimeValue(key, value, &dictionary_);
+}

 void VideoFrameMetadata::SetValue(Key key, scoped_ptr<base::Value> value) {
   dictionary_.SetWithoutPathExpansion(ToInternalKey(key), value.Pass());
@@ -83,16 +96,27 @@ bool VideoFrameMetadata::GetString(Key key, std::string* value) const {
   return !!binary_value;
 }

-bool VideoFrameMetadata::GetTimeTicks(Key key, base::TimeTicks* value) const {
+namespace {
+
+template <class TimeType>
+bool ToTimeValue(const base::BinaryValue& binary_value, TimeType* value) {
   DCHECK(value);
+  int64 internal_value;
+  if (binary_value.GetSize() != sizeof(internal_value))
+    return false;
+  memcpy(&internal_value, binary_value.GetBuffer(), sizeof(internal_value));
+  *value = TimeType::FromInternalValue(internal_value);
+  return true;
+}
+
+}  // namespace
+
+bool VideoFrameMetadata::GetTimeDelta(Key key, base::TimeDelta* value) const {
   const base::BinaryValue* const binary_value = GetBinaryValue(key);
-  if (binary_value && binary_value->GetSize() == sizeof(int64)) {
-    int64 internal_value;
-    memcpy(&internal_value, binary_value->GetBuffer(), sizeof(internal_value));
-    *value = base::TimeTicks::FromInternalValue(internal_value);
-    return true;
-  }
-  return false;
+  return binary_value && ToTimeValue(*binary_value, value);
+}
+
+bool VideoFrameMetadata::GetTimeTicks(Key key, base::TimeTicks* value) const {
+  const base::BinaryValue* const binary_value = GetBinaryValue(key);
+  return binary_value && ToTimeValue(*binary_value, value);
 }

 const base::Value* VideoFrameMetadata::GetValue(Key key) const {
...
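
Both setters funnel through the same int64 internal-value encoding, so a
set-then-get round-trip is lossless. A minimal sketch (values illustrative):

media::VideoFrameMetadata metadata;
const base::TimeDelta duration = base::TimeDelta::FromMilliseconds(33);
metadata.SetTimeDelta(media::VideoFrameMetadata::FRAME_DURATION, duration);

base::TimeDelta out;
// GetTimeDelta() fails only if the key is absent or the stored blob is not
// exactly sizeof(int64) bytes.
CHECK(metadata.GetTimeDelta(media::VideoFrameMetadata::FRAME_DURATION, &out));
CHECK(out == duration);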
@@ -21,8 +21,19 @@ class MEDIA_EXPORT VideoFrameMetadata {
     CAPTURE_BEGIN_TIME,
     CAPTURE_END_TIME,

+    // The estimated duration of this frame (i.e., the amount of time between
+    // the media timestamp of this frame and the next). Note that this is not
+    // the same information provided by FRAME_RATE, as FRAME_DURATION can
+    // vary unpredictably for every frame. Consumers can use this to optimize
+    // playback scheduling, make encoding quality decisions, and/or compute
+    // frame-level resource utilization stats. Use Get/SetTimeDelta() for
+    // this key.
+    FRAME_DURATION,
+
     // Represents either the fixed frame rate, or the maximum frame rate to
-    // expect from a variable-rate source. Use Get/SetDouble() for this key.
+    // expect from a variable-rate source. This value generally remains the
+    // same for all frames in the same session. Use Get/SetDouble() for this
+    // key.
     FRAME_RATE,

     NUM_KEYS
@@ -40,6 +51,7 @@ class MEDIA_EXPORT VideoFrameMetadata {
   void SetInteger(Key key, int value);
   void SetDouble(Key key, double value);
   void SetString(Key key, const std::string& value);
+  void SetTimeDelta(Key key, const base::TimeDelta& value);
   void SetTimeTicks(Key key, const base::TimeTicks& value);
   void SetValue(Key key, scoped_ptr<base::Value> value);
@@ -48,6 +60,7 @@ class MEDIA_EXPORT VideoFrameMetadata {
   bool GetInteger(Key key, int* value) const WARN_UNUSED_RESULT;
   bool GetDouble(Key key, double* value) const WARN_UNUSED_RESULT;
   bool GetString(Key key, std::string* value) const WARN_UNUSED_RESULT;
+  bool GetTimeDelta(Key key, base::TimeDelta* value) const WARN_UNUSED_RESULT;
   bool GetTimeTicks(Key key, base::TimeTicks* value) const WARN_UNUSED_RESULT;

   // Returns null if |key| was not present.
...
@@ -378,6 +378,14 @@ TEST(VideoFrameMetadata, SetAndThenGetAllKeysForAllTypes) {
     EXPECT_EQ(base::StringPrintf("\xfe%d\xff", i), string_value);
     metadata.Clear();

+    EXPECT_FALSE(metadata.HasKey(key));
+    metadata.SetTimeDelta(key, base::TimeDelta::FromInternalValue(42 + i));
+    EXPECT_TRUE(metadata.HasKey(key));
+    base::TimeDelta delta_value;
+    EXPECT_TRUE(metadata.GetTimeDelta(key, &delta_value));
+    EXPECT_EQ(base::TimeDelta::FromInternalValue(42 + i), delta_value);
+    metadata.Clear();
+
     EXPECT_FALSE(metadata.HasKey(key));
     metadata.SetTimeTicks(key, base::TimeTicks::FromInternalValue(~(0LL) + i));
     EXPECT_TRUE(metadata.HasKey(key));
...
@@ -215,20 +215,26 @@ void Vp8Encoder::Encode(const scoped_refptr<media::VideoFrame>& video_frame,
   // The frame duration given to the VP8 codec affects a number of important
   // behaviors, including: per-frame bandwidth, CPU time spent encoding,
   // temporal quality trade-offs, and key/golden/alt-ref frame generation
-  // intervals.  Use the actual amount of time between the current and previous
-  // frames as a prediction for the next frame's duration, but bound the
-  // prediction to account for the fact that the frame rate can be highly
-  // variable, including long pauses in the video stream.
+  // intervals.  Bound the prediction to account for the fact that the frame
+  // rate can be highly variable, including long pauses in the video stream.
   const base::TimeDelta minimum_frame_duration =
       base::TimeDelta::FromSecondsD(1.0 / cast_config_.max_frame_rate);
   const base::TimeDelta maximum_frame_duration =
       base::TimeDelta::FromSecondsD(static_cast<double>(kRestartFramePeriods) /
                                         cast_config_.max_frame_rate);
-  const base::TimeDelta last_frame_duration =
-      video_frame->timestamp() - last_frame_timestamp_;
-  const base::TimeDelta predicted_frame_duration =
+  base::TimeDelta predicted_frame_duration;
+  if (!video_frame->metadata()->GetTimeDelta(
+          media::VideoFrameMetadata::FRAME_DURATION,
+          &predicted_frame_duration) ||
+      predicted_frame_duration <= base::TimeDelta()) {
+    // The source of the video frame did not provide the frame duration.  Use
+    // the actual amount of time between the current and previous frame as a
+    // prediction for the next frame's duration.
+    predicted_frame_duration = video_frame->timestamp() - last_frame_timestamp_;
+  }
+  predicted_frame_duration =
       std::max(minimum_frame_duration,
-               std::min(maximum_frame_duration, last_frame_duration));
+               std::min(maximum_frame_duration, predicted_frame_duration));
   last_frame_timestamp_ = video_frame->timestamp();

   // Encode the frame.  The presentation time stamp argument here is fixed to
...
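
The clamp above keeps the prediction inside
[1 / max_frame_rate, kRestartFramePeriods / max_frame_rate]. Restated as a
standalone helper for clarity (ClampPredictedDuration is hypothetical, not
part of this change):

base::TimeDelta ClampPredictedDuration(base::TimeDelta predicted,
                                       double max_frame_rate,
                                       int restart_frame_periods) {
  const base::TimeDelta min_duration =
      base::TimeDelta::FromSecondsD(1.0 / max_frame_rate);
  const base::TimeDelta max_duration =
      base::TimeDelta::FromSecondsD(restart_frame_periods / max_frame_rate);
  // Bounding guards against highly variable frame rates, including long
  // pauses in the video stream (per the comment in Vp8Encoder::Encode()).
  return std::max(min_duration, std::min(max_duration, predicted));
}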