Refactor GPU Process Lifetime histogram calls

Use the UMA histogram functions instead of macros for the GPU.ProcessLifetimeEvents.* metrics. This way the histogram calls for the different GPU modes can be combined.

Also combine the three crash counters into |recent_crash_count_|, and reset it to zero when the GPU process starts crashing in a different GPU mode.

The histogram functions are slightly slower than the histogram macros because they don't cache the histogram object at the call site. These calls are made once during GPU process startup and once following a crash, so they don't occur on a performance-critical path.

Bug: 1005383, 1030757
Change-Id: I98aee0d50852794270c1c9b4c156e013080d23a3
Reviewed-on: https://chromium-review.googlesource.com/c/chromium/src/+/1961067
Commit-Queue: Sean Gilhuly <sgilhuly@chromium.org>
Reviewed-by: Zhenyao Mo <zmo@chromium.org>
Reviewed-by: kylechar <kylechar@chromium.org>
Cr-Commit-Position: refs/heads/master@{#724719}

Refactor GPU Process Lifetime histogram calls
Use the UMA histogram functions instead of macros for the GPU.ProcessLifetimeEvents.* metrics. This way the histogram calls for the different GPU modes can be combined.

Also combine the three crash counters into |recent_crash_count_|, and reset it to zero when the GPU process starts crashing in a different GPU mode.

The histogram functions are slightly slower than the histogram macros because they don't cache the histogram object at the call site. These calls are made once during GPU process startup and once following a crash, so they don't occur on a performance-critical path.

Bug: 1005383, 1030757
Change-Id: I98aee0d50852794270c1c9b4c156e013080d23a3
Reviewed-on: https://chromium-review.googlesource.com/c/chromium/src/+/1961067
Commit-Queue: Sean Gilhuly <sgilhuly@chromium.org>
Reviewed-by: Zhenyao Mo <zmo@chromium.org>
Reviewed-by: kylechar <kylechar@chromium.org>
Cr-Commit-Position: refs/heads/master@{#724719}
269cf4d2 · Sean Gilhuly · Commit Bot · 55fa79a4 · 269cf4d2 · 269cf4d2
Commit 269cf4d2 authored Dec 13, 2019 by Sean Gilhuly Committed by Commit Bot Dec 13, 2019
Hide whitespace changes
Inline Side-by-side

Showing with 56 additions and 56 deletions

content/browser/gpu/gpu_process_host.cc content/browser/gpu/gpu_process_host.cc +49 -49

content/browser/gpu/gpu_process_host.h content/browser/gpu/gpu_process_host.h +7 -7

No files found.
--- a/content/browser/gpu/gpu_process_host.cc
+++ b/content/browser/gpu/gpu_process_host.cc
@@ -107,9 +107,8 @@ namespace content {

 base::subtle::Atomic32 GpuProcessHost::gpu_crash_count_ = 0;
 bool GpuProcessHost::crashed_before_ = false;
-int GpuProcessHost::hardware_accelerated_recent_crash_count_ = 0;
-int GpuProcessHost::swiftshader_recent_crash_count_ = 0;
-int GpuProcessHost::display_compositor_recent_crash_count_ = 0;
+int GpuProcessHost::recent_crash_count_ = 0;
+gpu::GpuMode GpuProcessHost::last_crash_mode_ = gpu::GpuMode::UNKNOWN;

 namespace {

@@ -121,6 +120,21 @@ constexpr char kProcessLifetimeEventsSwiftShader[] =
 constexpr char kProcessLifetimeEventsDisplayCompositor[] =
    "GPU.ProcessLifetimeEvents.DisplayCompositor";

+// Returns the UMA histogram name for the given GPU mode.
+const char* GetProcessLifetimeUmaName(gpu::GpuMode gpu_mode) {
+  switch (gpu_mode) {
+    case gpu::GpuMode::HARDWARE_ACCELERATED:
+      return kProcessLifetimeEventsHardwareAccelerated;
+    case gpu::GpuMode::SWIFTSHADER:
+      return kProcessLifetimeEventsSwiftShader;
+    case gpu::GpuMode::DISPLAY_COMPOSITOR:
+      return kProcessLifetimeEventsDisplayCompositor;
+    default:
+      NOTREACHED();
+      return nullptr;
+  }
+}
+
 // Forgive one GPU process crash after this many minutes.
 constexpr int kForgiveGpuCrashMinutes = 60;

@@ -128,6 +142,12 @@ constexpr int kForgiveGpuCrashMinutes = 60;
 // the display compositor, after this many minutes.
 constexpr int kForgiveDisplayCompositorCrashMinutes = 10;

+int GetForgiveMinutes(gpu::GpuMode gpu_mode) {
+  return gpu_mode == gpu::GpuMode::DISPLAY_COMPOSITOR
+             ? kForgiveDisplayCompositorCrashMinutes
+             : kForgiveGpuCrashMinutes;
+}
+
 #if !defined(OS_ANDROID)
 // Feature controlling whether or not memory pressure signals will be forwarded
 // to the GPU process.
@@ -613,24 +633,31 @@ int GpuProcessHost::GetGpuCrashCount() {
 }

 // static
-void GpuProcessHost::IncrementCrashCount(int forgive_minutes,
-                                         int* crash_count) {
+void GpuProcessHost::IncrementCrashCount(gpu::GpuMode gpu_mode) {
+  int forgive_minutes = GetForgiveMinutes(gpu_mode);
  DCHECK_GT(forgive_minutes, 0);

  // Last time the process crashed.
  static base::TimeTicks last_crash_time;

-  // Remove one crash per |forgive_minutes| from the crash count, so occasional
-  // crashes won't add up and eventually prevent using the GPU process.
  base::TimeTicks current_time = base::TimeTicks::Now();
-  if (crashed_before_) {
+  if (gpu_mode != last_crash_mode_) {
+    // Reset the crash count when the GPU starts crashing in a different mode.
+    recent_crash_count_ = 0;
+  } else if (crashed_before_) {
+    // Remove one crash per |forgive_minutes| from the crash count, so
+    // occasional crashes won't add up and eventually prevent using the GPU
+    // process.
    int minutes_delta = (current_time - last_crash_time).InMinutes();
    int crashes_to_forgive = minutes_delta / forgive_minutes;
-    *crash_count = std::max(0, *crash_count - crashes_to_forgive);
+    recent_crash_count_ = std::max(0, recent_crash_count_ - crashes_to_forgive);
  }
-  ++(*crash_count);
+  recent_crash_count_ =
+      std::min(recent_crash_count_ + 1,
+               static_cast<int>(GPU_PROCESS_LIFETIME_EVENT_MAX) - 1);

  crashed_before_ = true;
+  last_crash_mode_ = gpu_mode;
  last_crash_time = current_time;
 }

@@ -965,7 +992,7 @@ void GpuProcessHost::DidInitialize(
  // Android may kill the GPU process to free memory, especially when the app
  // is in the background, so Android cannot have a hard limit on GPU starts.
  // Reset crash count on Android when context creation succeeds.
-  hardware_accelerated_recent_crash_count_ = 0;
+  recent_crash_count_ = 0;
 #endif
 }

@@ -980,7 +1007,7 @@ void GpuProcessHost::DidCreateContextSuccessfully() {
  // Android may kill the GPU process to free memory, especially when the app
  // is in the background, so Android cannot have a hard limit on GPU starts.
  // Reset crash count on Android when context creation succeeds.
-  hardware_accelerated_recent_crash_count_ = 0;
+  recent_crash_count_ = 0;
 #endif
 }

@@ -1136,16 +1163,8 @@ bool GpuProcessHost::LaunchGpuProcess() {
  process_launched_ = true;

  if (kind_ == GPU_PROCESS_KIND_SANDBOXED) {
-    if (mode_ == gpu::GpuMode::HARDWARE_ACCELERATED) {
-      UMA_HISTOGRAM_ENUMERATION(kProcessLifetimeEventsHardwareAccelerated,
-                                LAUNCHED, GPU_PROCESS_LIFETIME_EVENT_MAX);
-    } else if (mode_ == gpu::GpuMode::SWIFTSHADER) {
-      UMA_HISTOGRAM_ENUMERATION(kProcessLifetimeEventsSwiftShader, LAUNCHED,
-                                GPU_PROCESS_LIFETIME_EVENT_MAX);
-    } else if (mode_ == gpu::GpuMode::DISPLAY_COMPOSITOR) {
-      UMA_HISTOGRAM_ENUMERATION(kProcessLifetimeEventsDisplayCompositor,
-                                LAUNCHED, GPU_PROCESS_LIFETIME_EVENT_MAX);
-    }
+    base::UmaHistogramEnumeration(GetProcessLifetimeUmaName(mode_), LAUNCHED,
+                                  GPU_PROCESS_LIFETIME_EVENT_MAX);
  }

  return true;
@@ -1181,32 +1200,13 @@ void GpuProcessHost::RecordProcessCrash() {
  LOG(WARNING) << "The GPU process has crashed " << GetGpuCrashCount()
               << " time(s)";

-  int recent_crash_count = 0;
-  if (mode_ == gpu::GpuMode::HARDWARE_ACCELERATED) {
-    IncrementCrashCount(kForgiveGpuCrashMinutes,
-                        &hardware_accelerated_recent_crash_count_);
-    UMA_HISTOGRAM_EXACT_LINEAR(
-        kProcessLifetimeEventsHardwareAccelerated,
-        DIED_FIRST_TIME + hardware_accelerated_recent_crash_count_ - 1,
-        static_cast<int>(GPU_PROCESS_LIFETIME_EVENT_MAX));
-    recent_crash_count = hardware_accelerated_recent_crash_count_;
-  } else if (mode_ == gpu::GpuMode::SWIFTSHADER) {
-    IncrementCrashCount(kForgiveGpuCrashMinutes,
-                        &swiftshader_recent_crash_count_);
-    UMA_HISTOGRAM_EXACT_LINEAR(
-        kProcessLifetimeEventsSwiftShader,
-        DIED_FIRST_TIME + swiftshader_recent_crash_count_ - 1,
-        static_cast<int>(GPU_PROCESS_LIFETIME_EVENT_MAX));
-    recent_crash_count = swiftshader_recent_crash_count_;
-  } else if (mode_ == gpu::GpuMode::DISPLAY_COMPOSITOR) {
-    IncrementCrashCount(kForgiveDisplayCompositorCrashMinutes,
-                        &display_compositor_recent_crash_count_);
-    UMA_HISTOGRAM_EXACT_LINEAR(
-        kProcessLifetimeEventsDisplayCompositor,
-        DIED_FIRST_TIME + display_compositor_recent_crash_count_ - 1,
-        static_cast<int>(GPU_PROCESS_LIFETIME_EVENT_MAX));
-    recent_crash_count = display_compositor_recent_crash_count_;
-  }
+  // It's possible GPU mode fallback has already happened. In this case, |mode_|
+  // will still be the mode of the failed process.
+  IncrementCrashCount(mode_);
+  base::UmaHistogramExactLinear(
+      GetProcessLifetimeUmaName(mode_),
+      DIED_FIRST_TIME + recent_crash_count_ - 1,
+      static_cast<int>(GPU_PROCESS_LIFETIME_EVENT_MAX));

  // GPU process initialization failed and fallback already happened.
  if (did_fail_initialize_)
@@ -1217,7 +1217,7 @@ void GpuProcessHost::RecordProcessCrash() {

  // GPU process crashed too many times, fallback on a different GPU process
  // mode.
-  if (recent_crash_count >= kGpuFallbackCrashCount && !disable_crash_limit)
+  if (recent_crash_count_ >= kGpuFallbackCrashCount && !disable_crash_limit)
    GpuDataManagerImpl::GetInstance()->FallBackToNextGpuMode();
 }


--- a/content/browser/gpu/gpu_process_host.h
+++ b/content/browser/gpu/gpu_process_host.h
@@ -119,10 +119,11 @@ class GpuProcessHost : public BrowserChildProcessHostDelegate,

  static bool ValidateHost(GpuProcessHost* host);

-  // Increments |crash_count| by one. Before incrementing |crash_count|, for
-  // each |forgive_minutes| that has passed since the previous crash remove one
-  // old crash.
-  static void IncrementCrashCount(int forgive_minutes, int* crash_count);
+  // Increments |recent_crash_count_| by one. Before incrementing, remove one
+  // old crash for each forgiveness interval that has passed since the previous
+  // crash. If |gpu_mode| doesn't match |last_crash_mode_|, first reset the
+  // crash count.
+  static void IncrementCrashCount(gpu::GpuMode gpu_mode);

  GpuProcessHost(int host_id, GpuProcessKind kind);
  ~GpuProcessHost() override;
@@ -223,9 +224,8 @@ class GpuProcessHost : public BrowserChildProcessHostDelegate,
  // The total number of GPU process crashes.
  static base::subtle::Atomic32 gpu_crash_count_;
  static bool crashed_before_;
-  static int hardware_accelerated_recent_crash_count_;
-  static int swiftshader_recent_crash_count_;
-  static int display_compositor_recent_crash_count_;
+  static int recent_crash_count_;
+  static gpu::GpuMode last_crash_mode_;

  // Here the bottom-up destruction order matters:
  // The GPU thread depends on its host so stop the host last.