forked from mirrors/gecko-dev
		
	This patch wants to solve several quirks around the shutdown terminator. - Use the same shutdown phase definitions in AppShutdown and nsTerminator. This touches quite a few files. - Ensure that the terminator phase shift is handled before any shutdown observer notifications are sent and reduce its heartbeat duration. - Add missing phases to the shutdown telemetry. Please note that this changes the unit of "tick" to 100ms rather than 1s. As a side effect, we also remove the obsolete "shutdown-persist" context. While the existing test coverage continues to prove the most important functions, we acknowledge the wish for better test coverage with [[ https://bugzilla.mozilla.org/show_bug.cgi?id=1693966 | bug 1693966 ]]. Differential Revision: https://phabricator.services.mozilla.com/D103626
		
			
				
	
	
		
			608 lines
		
	
	
	
		
			20 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			608 lines
		
	
	
	
		
			20 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*-
 | 
						|
 * vim: sw=2 ts=2 et lcs=trail\:.,tab\:>~ :
 | 
						|
 * This Source Code Form is subject to the terms of the Mozilla Public
 | 
						|
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 | 
						|
 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
 | 
						|
 | 
						|
/**
 | 
						|
 * A watchdog designed to terminate shutdown if it lasts too long.
 | 
						|
 *
 | 
						|
 * This watchdog is designed as a worst-case problem container for the
 | 
						|
 * common case in which Firefox just won't shutdown.
 | 
						|
 *
 | 
						|
 * We spawn a thread during quit-application. If any of the shutdown
 | 
						|
 * steps takes more than n milliseconds (63000 by default), kill the
 | 
						|
 * process as fast as possible, without any cleanup.
 | 
						|
 */
 | 
						|
 | 
						|
#include "mozilla/ShutdownPhase.h"
 | 
						|
#include "nsTerminator.h"
 | 
						|
 | 
						|
#include "prthread.h"
 | 
						|
#include "prmon.h"
 | 
						|
#include "plstr.h"
 | 
						|
#include "prio.h"
 | 
						|
 | 
						|
#include "nsString.h"
 | 
						|
#include "nsServiceManagerUtils.h"
 | 
						|
#include "nsDirectoryServiceUtils.h"
 | 
						|
#include "nsAppDirectoryServiceDefs.h"
 | 
						|
 | 
						|
#include "nsIObserverService.h"
 | 
						|
#include "nsExceptionHandler.h"
 | 
						|
#include "GeckoProfiler.h"
 | 
						|
#include "nsThreadUtils.h"
 | 
						|
#include "nsXULAppAPI.h"
 | 
						|
 | 
						|
#if defined(XP_WIN)
 | 
						|
#  include <windows.h>
 | 
						|
#else
 | 
						|
#  include <unistd.h>
 | 
						|
#endif
 | 
						|
 | 
						|
#include "mozilla/AppShutdown.h"
 | 
						|
#include "mozilla/ArrayUtils.h"
 | 
						|
#include "mozilla/Atomics.h"
 | 
						|
#include "mozilla/Attributes.h"
 | 
						|
#include "mozilla/DebugOnly.h"
 | 
						|
#include "mozilla/IntentionalCrash.h"
 | 
						|
#include "mozilla/MemoryChecking.h"
 | 
						|
#include "mozilla/Preferences.h"
 | 
						|
#include "mozilla/Services.h"
 | 
						|
#include "mozilla/UniquePtr.h"
 | 
						|
#include "mozilla/Unused.h"
 | 
						|
#include "mozilla/Telemetry.h"
 | 
						|
 | 
						|
#include "mozilla/dom/IOUtils.h"
 | 
						|
#include "mozilla/dom/workerinternals/RuntimeService.h"
 | 
						|
 | 
						|
// Normally, the number of milliseconds that AsyncShutdown waits until
 | 
						|
// it decides to crash is specified as a preference. We use the
 | 
						|
// following value as a fallback if for some reason the preference is
 | 
						|
// absent.
 | 
						|
#define FALLBACK_ASYNCSHUTDOWN_CRASH_AFTER_MS 60000
 | 
						|
 | 
						|
// Additional number of milliseconds to wait until we decide to exit
 | 
						|
// forcefully.
 | 
						|
#define ADDITIONAL_WAIT_BEFORE_CRASH_MS 3000
 | 
						|
 | 
						|
#define HEARTBEAT_INTERVAL_MS 100
 | 
						|
 | 
						|
namespace mozilla {
 | 
						|
 | 
						|
namespace {
 | 
						|
 | 
						|
/**
 | 
						|
 * A step during shutdown.
 | 
						|
 *
 | 
						|
 * Shutdown is divided in steps, which all map to an observer
 | 
						|
 * notification. The duration of a step is defined as the number of
 | 
						|
 * ticks between the time we receive a notification and the next one.
 | 
						|
 */
 | 
						|
struct ShutdownStep {
 | 
						|
  mozilla::ShutdownPhase mPhase;
 | 
						|
  int mTicks;
 | 
						|
 | 
						|
  constexpr explicit ShutdownStep(mozilla::ShutdownPhase aPhase)
 | 
						|
      : mPhase(aPhase), mTicks(-1) {}
 | 
						|
};
 | 
						|
 | 
						|
static ShutdownStep sShutdownSteps[] = {
 | 
						|
    ShutdownStep(mozilla::ShutdownPhase::AppShutdownConfirmed),
 | 
						|
    ShutdownStep(mozilla::ShutdownPhase::AppShutdownNetTeardown),
 | 
						|
    ShutdownStep(mozilla::ShutdownPhase::AppShutdownTeardown),
 | 
						|
    ShutdownStep(mozilla::ShutdownPhase::AppShutdown),
 | 
						|
    ShutdownStep(mozilla::ShutdownPhase::AppShutdownQM),
 | 
						|
    ShutdownStep(mozilla::ShutdownPhase::XPCOMWillShutdown),
 | 
						|
    ShutdownStep(mozilla::ShutdownPhase::XPCOMShutdown),
 | 
						|
};
 | 
						|
 | 
						|
Atomic<bool> sShutdownNotified;
 | 
						|
 | 
						|
int GetStepForPhase(mozilla::ShutdownPhase aPhase) {
 | 
						|
  for (size_t i = 0; i < std::size(sShutdownSteps); i++) {
 | 
						|
    if (sShutdownSteps[i].mPhase >= aPhase) {
 | 
						|
      return (int)i;
 | 
						|
    }
 | 
						|
  }
 | 
						|
  return -1;
 | 
						|
}
 | 
						|
 | 
						|
// Utility function: create a thread that is non-joinable,
 | 
						|
// does not prevent the process from terminating, is never
 | 
						|
// cooperatively scheduled, and uses a default stack size.
 | 
						|
PRThread* CreateSystemThread(void (*start)(void* arg), void* arg) {
 | 
						|
  PRThread* thread =
 | 
						|
      PR_CreateThread(PR_SYSTEM_THREAD, /* This thread will not prevent the
 | 
						|
                                           process from terminating */
 | 
						|
                      start, arg, PR_PRIORITY_LOW,
 | 
						|
                      PR_GLOBAL_THREAD, /* Make sure that the thread is never
 | 
						|
                                           cooperatively scheduled */
 | 
						|
                      PR_UNJOINABLE_THREAD, 0 /* Use default stack size */
 | 
						|
      );
 | 
						|
  MOZ_LSAN_INTENTIONALLY_LEAK_OBJECT(
 | 
						|
      thread);  // This pointer will never be deallocated.
 | 
						|
  return thread;
 | 
						|
}
 | 
						|
 | 
						|
////////////////////////////////////////////
 | 
						|
//
 | 
						|
// The watchdog
 | 
						|
//
 | 
						|
// This nspr thread is in charge of crashing the process if any stage of
 | 
						|
// shutdown lasts more than some predefined duration. As a side-effect, it
 | 
						|
// measures the duration of each stage of shutdown.
 | 
						|
//
 | 
						|
 | 
						|
// The heartbeat of the operation.
 | 
						|
//
 | 
						|
// Main thread:
 | 
						|
//
 | 
						|
// * Whenever a shutdown step has been completed, the main thread
 | 
						|
// swaps gHeartbeat to 0 to mark that the shutdown process is still
 | 
						|
// progressing. The value swapped away indicates the number of ticks
 | 
						|
// it took for the shutdown step to advance.
 | 
						|
//
 | 
						|
// Watchdog thread:
 | 
						|
//
 | 
						|
// * Every tick, the watchdog thread increments gHearbeat atomically.
 | 
						|
//
 | 
						|
// A note about precision:
 | 
						|
// Since gHeartbeat is generally reset to 0 between two ticks, this means
 | 
						|
// that gHeartbeat stays at 0 less than one tick. Consequently, values
 | 
						|
// extracted from gHeartbeat must be considered rounded up.
 | 
						|
Atomic<uint32_t> gHeartbeat(0);
 | 
						|
 | 
						|
struct Options {
 | 
						|
  /**
 | 
						|
   * How many ticks before we should crash the process.
 | 
						|
   */
 | 
						|
  uint32_t crashAfterTicks;
 | 
						|
};
 | 
						|
 | 
						|
/**
 | 
						|
 * Entry point for the watchdog thread
 | 
						|
 */
 | 
						|
void RunWatchdog(void* arg) {
 | 
						|
  NS_SetCurrentThreadName("Shutdown Hang Terminator");
 | 
						|
 | 
						|
  // Let's copy and deallocate options, that's one less leak to worry
 | 
						|
  // about.
 | 
						|
  UniquePtr<Options> options((Options*)arg);
 | 
						|
  uint32_t crashAfterTicks = options->crashAfterTicks;
 | 
						|
  options = nullptr;
 | 
						|
 | 
						|
  const uint32_t timeToLive = crashAfterTicks;
 | 
						|
  while (true) {
 | 
						|
    //
 | 
						|
    // We do not want to sleep for the entire duration,
 | 
						|
    // as putting the computer to sleep would suddenly
 | 
						|
    // cause us to timeout on wakeup.
 | 
						|
    //
 | 
						|
    // Rather, we prefer sleeping for at most 1 second
 | 
						|
    // at a time. If the computer sleeps then wakes up,
 | 
						|
    // we have lost at most one second, which is much
 | 
						|
    // more reasonable.
 | 
						|
    //
 | 
						|
#if defined(XP_WIN)
 | 
						|
    Sleep(HEARTBEAT_INTERVAL_MS /* ms */);
 | 
						|
#else
 | 
						|
    usleep(HEARTBEAT_INTERVAL_MS * 1000 /* usec */);
 | 
						|
#endif
 | 
						|
 | 
						|
    if (gHeartbeat++ < timeToLive) {
 | 
						|
      continue;
 | 
						|
    }
 | 
						|
 | 
						|
    NoteIntentionalCrash(XRE_GetProcessTypeString());
 | 
						|
 | 
						|
    // The shutdown steps are not completed yet. Let's report the last one.
 | 
						|
    if (!sShutdownNotified) {
 | 
						|
      mozilla::ShutdownPhase lastStep = mozilla::ShutdownPhase::NotInShutdown;
 | 
						|
      // Looping inverse here to make the search more robust in case
 | 
						|
      // the observer that triggers UpdateHeartbeat was not called
 | 
						|
      // at all or in the expected order on some step. This should
 | 
						|
      // give us always the last known ShutdownStep.
 | 
						|
      for (int i = ArrayLength(sShutdownSteps) - 1; i >= 0; --i) {
 | 
						|
        if (sShutdownSteps[i].mTicks > -1) {
 | 
						|
          lastStep = sShutdownSteps[i].mPhase;
 | 
						|
          break;
 | 
						|
        }
 | 
						|
      }
 | 
						|
 | 
						|
      if (lastStep != mozilla::ShutdownPhase::NotInShutdown) {
 | 
						|
        nsCString msg;
 | 
						|
        msg.AppendPrintf(
 | 
						|
            "Shutdown hanging at step %s. "
 | 
						|
            "Something is blocking the main-thread.",
 | 
						|
            mozilla::AppShutdown::GetObserverKey(lastStep));
 | 
						|
        // This string will be leaked.
 | 
						|
        MOZ_CRASH_UNSAFE(strdup(msg.BeginReading()));
 | 
						|
      }
 | 
						|
 | 
						|
      MOZ_CRASH("Shutdown hanging before starting any known phase.");
 | 
						|
    }
 | 
						|
 | 
						|
    // Maybe some workers are blocking the shutdown.
 | 
						|
    mozilla::dom::workerinternals::RuntimeService* runtimeService =
 | 
						|
        mozilla::dom::workerinternals::RuntimeService::GetService();
 | 
						|
    if (runtimeService) {
 | 
						|
      runtimeService->CrashIfHanging();
 | 
						|
    }
 | 
						|
 | 
						|
    // If we get here, we know that all shutdown phases have been
 | 
						|
    // finished successfully and no worker is hanging.
 | 
						|
    // Therefore there should be nothing left worth waiting for.
 | 
						|
    // We give us a short extra time in case we have a late race
 | 
						|
    // and are about to have a clean shutdown anyway.
 | 
						|
#if defined(XP_WIN)
 | 
						|
    Sleep(1000 /* ms */);
 | 
						|
#else
 | 
						|
    usleep(1000000 /* usec */);
 | 
						|
#endif
 | 
						|
 | 
						|
    // If we are still alive then we just crash.
 | 
						|
    CrashReporter::SetMinidumpAnalysisAllThreads();
 | 
						|
    MOZ_CRASH("Shutdown hanging after all known phases and workers finished.");
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
////////////////////////////////////////////
 | 
						|
//
 | 
						|
// Writer thread
 | 
						|
//
 | 
						|
// This nspr thread is in charge of writing to disk statistics produced by the
 | 
						|
// watchdog thread and collected by the main thread. Note that we use a nspr
 | 
						|
// thread rather than usual XPCOM I/O simply because we outlive XPCOM and its
 | 
						|
// threads.
 | 
						|
//
 | 
						|
 | 
						|
//
 | 
						|
// Communication between the main thread and the writer thread.
 | 
						|
//
 | 
						|
// Main thread:
 | 
						|
//
 | 
						|
// * Whenever a shutdown step has been completed, the main thread
 | 
						|
// obtains the number of ticks from the watchdog threads, builds
 | 
						|
// a string representing all the data gathered so far, places
 | 
						|
// this string in `gWriteData`, and wakes up the writer thread
 | 
						|
// using `gWriteReady`. If `gWriteData` already contained a non-null
 | 
						|
// pointer, this means that the writer thread is lagging behind the
 | 
						|
// main thread, and the main thread cleans up the memory.
 | 
						|
//
 | 
						|
// Writer thread:
 | 
						|
//
 | 
						|
// * When awake, the writer thread swaps `gWriteData` to nullptr. If
 | 
						|
// `gWriteData` contained data to write, the . If so, the writer
 | 
						|
// thread writes the data to a file named "ShutdownDuration.json.tmp",
 | 
						|
// then moves that file to "ShutdownDuration.json" and cleans up the
 | 
						|
// data. If `gWriteData` contains a nullptr, the writer goes to sleep
 | 
						|
// until it is awkened using `gWriteReady`.
 | 
						|
//
 | 
						|
//
 | 
						|
// The data written by the writer thread will be read by another
 | 
						|
// module upon the next restart and fed to Telemetry.
 | 
						|
//
 | 
						|
Atomic<nsCString*> gWriteData(nullptr);
 | 
						|
PRMonitor* gWriteReady = nullptr;
 | 
						|
 | 
						|
void RunWriter(void* arg) {
 | 
						|
  AUTO_PROFILER_REGISTER_THREAD("Shutdown Statistics Writer");
 | 
						|
  NS_SetCurrentThreadName("Shutdown Statistics Writer");
 | 
						|
 | 
						|
  MOZ_LSAN_INTENTIONALLY_LEAK_OBJECT(arg);
 | 
						|
  // Shutdown will generally complete before we have a chance to
 | 
						|
  // deallocate. This is not a leak.
 | 
						|
 | 
						|
  // Setup destinationPath and tmpFilePath
 | 
						|
 | 
						|
  nsCString destinationPath;
 | 
						|
  destinationPath.Adopt(static_cast<char*>(arg));
 | 
						|
  nsAutoCString tmpFilePath;
 | 
						|
  tmpFilePath.Append(destinationPath);
 | 
						|
  tmpFilePath.AppendLiteral(".tmp");
 | 
						|
 | 
						|
  // Cleanup any file leftover from a previous run
 | 
						|
  Unused << PR_Delete(tmpFilePath.get());
 | 
						|
  Unused << PR_Delete(destinationPath.get());
 | 
						|
 | 
						|
  while (true) {
 | 
						|
    //
 | 
						|
    // Check whether we have received data from the main thread.
 | 
						|
    //
 | 
						|
    // We perform the check before waiting on `gWriteReady` as we may
 | 
						|
    // have received data while we were busy writing.
 | 
						|
    //
 | 
						|
    // Also note that gWriteData may have been modified several times
 | 
						|
    // since we last checked. That's ok, we are not losing any important
 | 
						|
    // data (since we keep adding data), and we are not leaking memory
 | 
						|
    // (since the main thread deallocates any data that hasn't been
 | 
						|
    // consumed by the writer thread).
 | 
						|
    //
 | 
						|
    UniquePtr<nsCString> data(gWriteData.exchange(nullptr));
 | 
						|
    if (!data) {
 | 
						|
      // Data is not available yet.
 | 
						|
      // Wait until the main thread provides it.
 | 
						|
      PR_EnterMonitor(gWriteReady);
 | 
						|
      PR_Wait(gWriteReady, PR_INTERVAL_NO_TIMEOUT);
 | 
						|
      PR_ExitMonitor(gWriteReady);
 | 
						|
      continue;
 | 
						|
    }
 | 
						|
 | 
						|
    MOZ_LSAN_INTENTIONALLY_LEAK_OBJECT(data.get());
 | 
						|
    // Shutdown may complete before we have a chance to deallocate.
 | 
						|
    // This is not a leak.
 | 
						|
 | 
						|
    //
 | 
						|
    // Write to a temporary file
 | 
						|
    //
 | 
						|
    // In case of any error, we simply give up. Since the data is
 | 
						|
    // hardly critical, we don't want to spend too much effort
 | 
						|
    // salvaging it.
 | 
						|
    //
 | 
						|
    UniquePtr<PRFileDesc, PR_CloseDelete> tmpFileDesc(PR_Open(
 | 
						|
        tmpFilePath.get(), PR_WRONLY | PR_TRUNCATE | PR_CREATE_FILE, 00600));
 | 
						|
 | 
						|
    // Shutdown may complete before we have a chance to close the file.
 | 
						|
    // This is not a leak.
 | 
						|
    MOZ_LSAN_INTENTIONALLY_LEAK_OBJECT(tmpFileDesc.get());
 | 
						|
 | 
						|
    if (tmpFileDesc == nullptr) {
 | 
						|
      break;
 | 
						|
    }
 | 
						|
    if (PR_Write(tmpFileDesc.get(), data->get(), data->Length()) == -1) {
 | 
						|
      break;
 | 
						|
    }
 | 
						|
    tmpFileDesc.reset();
 | 
						|
 | 
						|
    //
 | 
						|
    // Rename on top of destination file.
 | 
						|
    //
 | 
						|
    // This is not sufficient to guarantee that the destination file
 | 
						|
    // will be written correctly, but, again, we don't care enough
 | 
						|
    // about the data to make more efforts.
 | 
						|
    //
 | 
						|
    Unused << PR_Delete(destinationPath.get());
 | 
						|
    if (PR_Rename(tmpFilePath.get(), destinationPath.get()) != PR_SUCCESS) {
 | 
						|
      break;
 | 
						|
    }
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
}  // namespace
 | 
						|
 | 
						|
NS_IMPL_ISUPPORTS(nsTerminator, nsIObserver)
 | 
						|
 | 
						|
nsTerminator::nsTerminator() : mInitialized(false), mCurrentStep(-1) {}
 | 
						|
 | 
						|
// Actually launch these threads. This takes place at the first sign of
 | 
						|
// shutdown.
 | 
						|
void nsTerminator::Start() {
 | 
						|
  MOZ_ASSERT(!mInitialized);
 | 
						|
  sShutdownNotified = false;
 | 
						|
  StartWatchdog();
 | 
						|
#if !defined(NS_FREE_PERMANENT_DATA)
 | 
						|
  // Only allow nsTerminator to write on non-leak-checked builds so we don't
 | 
						|
  // get leak warnings on shutdown for intentional leaks (see bug 1242084).
 | 
						|
  // This will be enabled again by bug 1255484 when 1255478 lands.
 | 
						|
  StartWriter();
 | 
						|
#endif  // !defined(NS_FREE_PERMANENT_DATA)
 | 
						|
  mInitialized = true;
 | 
						|
}
 | 
						|
 | 
						|
NS_IMETHODIMP
 | 
						|
nsTerminator::Observe(nsISupports*, const char* aTopic, const char16_t*) {
 | 
						|
  // This Observe is now only used for testing purposes.
 | 
						|
  // XXX: Check if we should change our testing strategy.
 | 
						|
  if (strcmp(aTopic, "terminator-test-quit-application") == 0) {
 | 
						|
    AdvancePhase(mozilla::ShutdownPhase::AppShutdownConfirmed);
 | 
						|
  } else if (strcmp(aTopic, "terminator-test-profile-change-net-teardown") ==
 | 
						|
             0) {
 | 
						|
    AdvancePhase(mozilla::ShutdownPhase::AppShutdownNetTeardown);
 | 
						|
  } else if (strcmp(aTopic, "terminator-test-profile-change-teardown") == 0) {
 | 
						|
    AdvancePhase(mozilla::ShutdownPhase::AppShutdownTeardown);
 | 
						|
  } else if (strcmp(aTopic, "terminator-test-profile-before-change") == 0) {
 | 
						|
    AdvancePhase(mozilla::ShutdownPhase::AppShutdown);
 | 
						|
  } else if (strcmp(aTopic, "terminator-test-profile-before-change-qm") == 0) {
 | 
						|
    AdvancePhase(mozilla::ShutdownPhase::AppShutdownQM);
 | 
						|
  } else if (strcmp(aTopic,
 | 
						|
                    "terminator-test-profile-before-change-telemetry") == 0) {
 | 
						|
    AdvancePhase(mozilla::ShutdownPhase::AppShutdownTelemetry);
 | 
						|
  } else if (strcmp(aTopic, "terminator-test-xpcom-will-shutdown") == 0) {
 | 
						|
    AdvancePhase(mozilla::ShutdownPhase::XPCOMWillShutdown);
 | 
						|
  } else if (strcmp(aTopic, "terminator-test-xpcom-shutdown") == 0) {
 | 
						|
    AdvancePhase(mozilla::ShutdownPhase::XPCOMShutdown);
 | 
						|
  }
 | 
						|
 | 
						|
  return NS_OK;
 | 
						|
}
 | 
						|
 | 
						|
// Prepare, allocate and start the watchdog thread.
 | 
						|
// By design, it will never finish, nor be deallocated.
 | 
						|
void nsTerminator::StartWatchdog() {
 | 
						|
  int32_t crashAfterMS =
 | 
						|
      Preferences::GetInt("toolkit.asyncshutdown.crash_timeout",
 | 
						|
                          FALLBACK_ASYNCSHUTDOWN_CRASH_AFTER_MS);
 | 
						|
  // Ignore negative values
 | 
						|
  if (crashAfterMS <= 0) {
 | 
						|
    crashAfterMS = FALLBACK_ASYNCSHUTDOWN_CRASH_AFTER_MS;
 | 
						|
  }
 | 
						|
 | 
						|
  // Add a little padding, to ensure that we do not crash before
 | 
						|
  // AsyncShutdown.
 | 
						|
  if (crashAfterMS > INT32_MAX - ADDITIONAL_WAIT_BEFORE_CRASH_MS) {
 | 
						|
    // Defend against overflow
 | 
						|
    crashAfterMS = INT32_MAX;
 | 
						|
  } else {
 | 
						|
    crashAfterMS += ADDITIONAL_WAIT_BEFORE_CRASH_MS;
 | 
						|
  }
 | 
						|
 | 
						|
#ifdef MOZ_VALGRIND
 | 
						|
  // If we're running on Valgrind, we'll be making forward progress at a
 | 
						|
  // rate of somewhere between 1/25th and 1/50th of normal.  This can cause
 | 
						|
  // timeouts frequently enough to be a problem for the Valgrind runs on
 | 
						|
  // automation: see bug 1296819.  As an attempt to avoid the worst of this,
 | 
						|
  // scale up the presented timeout by a factor of three.  For a
 | 
						|
  // non-Valgrind-enabled build, or for an enabled build which isn't running
 | 
						|
  // on Valgrind, the timeout is unchanged.
 | 
						|
  if (RUNNING_ON_VALGRIND) {
 | 
						|
    const int32_t scaleUp = 3;
 | 
						|
    if (crashAfterMS >= (INT32_MAX / scaleUp) - 1) {
 | 
						|
      // Defend against overflow
 | 
						|
      crashAfterMS = INT32_MAX;
 | 
						|
    } else {
 | 
						|
      crashAfterMS *= scaleUp;
 | 
						|
    }
 | 
						|
  }
 | 
						|
#endif
 | 
						|
 | 
						|
  UniquePtr<Options> options(new Options());
 | 
						|
  const PRIntervalTime ticksDuration =
 | 
						|
      PR_MillisecondsToInterval(HEARTBEAT_INTERVAL_MS);
 | 
						|
  options->crashAfterTicks = crashAfterMS / ticksDuration;
 | 
						|
  // Handle systems where ticksDuration is greater than crashAfterMS.
 | 
						|
  if (options->crashAfterTicks == 0) {
 | 
						|
    options->crashAfterTicks = crashAfterMS / HEARTBEAT_INTERVAL_MS;
 | 
						|
  }
 | 
						|
 | 
						|
  DebugOnly<PRThread*> watchdogThread =
 | 
						|
      CreateSystemThread(RunWatchdog, options.release());
 | 
						|
  MOZ_ASSERT(watchdogThread);
 | 
						|
}
 | 
						|
 | 
						|
// Prepare, allocate and start the writer thread. By design, it will never
 | 
						|
// finish, nor be deallocated. In case of error, we degrade
 | 
						|
// gracefully to not writing Telemetry data.
 | 
						|
void nsTerminator::StartWriter() {
 | 
						|
  if (!Telemetry::CanRecordExtended()) {
 | 
						|
    return;
 | 
						|
  }
 | 
						|
  nsCOMPtr<nsIFile> profLD;
 | 
						|
  nsresult rv = NS_GetSpecialDirectory(NS_APP_USER_PROFILE_LOCAL_50_DIR,
 | 
						|
                                       getter_AddRefs(profLD));
 | 
						|
  if (NS_FAILED(rv)) {
 | 
						|
    return;
 | 
						|
  }
 | 
						|
 | 
						|
  rv = profLD->Append(u"ShutdownDuration.json"_ns);
 | 
						|
  if (NS_FAILED(rv)) {
 | 
						|
    return;
 | 
						|
  }
 | 
						|
 | 
						|
  nsAutoString path;
 | 
						|
  rv = profLD->GetPath(path);
 | 
						|
  if (NS_FAILED(rv)) {
 | 
						|
    return;
 | 
						|
  }
 | 
						|
 | 
						|
  gWriteReady = PR_NewMonitor();
 | 
						|
  MOZ_LSAN_INTENTIONALLY_LEAK_OBJECT(
 | 
						|
      gWriteReady);  // We will never deallocate this object
 | 
						|
  PRThread* writerThread = CreateSystemThread(RunWriter, ToNewUTF8String(path));
 | 
						|
 | 
						|
  if (!writerThread) {
 | 
						|
    return;
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
void nsTerminator::AdvancePhase(mozilla::ShutdownPhase aPhase) {
 | 
						|
  // If we are done, do nothing
 | 
						|
  if (sShutdownNotified) {
 | 
						|
    return;
 | 
						|
  }
 | 
						|
  // As we have seen examples in the wild of shutdown notifications
 | 
						|
  // not being sent (or not being sent in the expected order), we do
 | 
						|
  // not assume a specific order.
 | 
						|
  if (!mInitialized) {
 | 
						|
    Start();
 | 
						|
  }
 | 
						|
 | 
						|
  UpdateHeartbeat(GetStepForPhase(aPhase));
 | 
						|
#if !defined(NS_FREE_PERMANENT_DATA)
 | 
						|
  // Only allow nsTerminator to write on non-leak checked builds so we don't get
 | 
						|
  // leak warnings on shutdown for intentional leaks (see bug 1242084). This
 | 
						|
  // will be enabled again by bug 1255484 when 1255478 lands.
 | 
						|
  UpdateTelemetry();
 | 
						|
#endif  // !defined(NS_FREE_PERMANENT_DATA)
 | 
						|
  UpdateCrashReport(mozilla::AppShutdown::GetObserverKey(aPhase));
 | 
						|
}
 | 
						|
 | 
						|
void nsTerminator::UpdateHeartbeat(int32_t aStep) {
 | 
						|
  MOZ_ASSERT(aStep >= mCurrentStep);
 | 
						|
 | 
						|
  if (aStep > mCurrentStep) {
 | 
						|
    // Reset the clock, find out how long the current phase has lasted.
 | 
						|
    uint32_t ticks = gHeartbeat.exchange(0);
 | 
						|
    if (mCurrentStep >= 0) {
 | 
						|
      sShutdownSteps[mCurrentStep].mTicks = ticks;
 | 
						|
    }
 | 
						|
    sShutdownSteps[aStep].mTicks = 0;
 | 
						|
 | 
						|
    mCurrentStep = aStep;
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
void nsTerminator::UpdateTelemetry() {
 | 
						|
  if (!Telemetry::CanRecordExtended() || !gWriteReady) {
 | 
						|
    return;
 | 
						|
  }
 | 
						|
 | 
						|
  //
 | 
						|
  // We need Telemetry data on the effective duration of each step,
 | 
						|
  // to be able to tune the time-to-crash of each of both the
 | 
						|
  // Terminator and AsyncShutdown. However, at this stage, it is too
 | 
						|
  // late to record such data into Telemetry, so we write it to disk
 | 
						|
  // and read it upon the next startup.
 | 
						|
  //
 | 
						|
 | 
						|
  // Build JSON.
 | 
						|
  UniquePtr<nsCString> telemetryData(new nsCString());
 | 
						|
  telemetryData->AppendLiteral("{");
 | 
						|
  size_t fields = 0;
 | 
						|
  for (auto& shutdownStep : sShutdownSteps) {
 | 
						|
    if (shutdownStep.mTicks < 0) {
 | 
						|
      // Ignore this field.
 | 
						|
      continue;
 | 
						|
    }
 | 
						|
    if (fields++ > 0) {
 | 
						|
      telemetryData->AppendLiteral(", ");
 | 
						|
    }
 | 
						|
    telemetryData->AppendLiteral(R"(")");
 | 
						|
    telemetryData->Append(
 | 
						|
        mozilla::AppShutdown::GetObserverKey(shutdownStep.mPhase));
 | 
						|
    telemetryData->AppendLiteral(R"(": )");
 | 
						|
    telemetryData->AppendInt(shutdownStep.mTicks);
 | 
						|
  }
 | 
						|
  telemetryData->AppendLiteral("}");
 | 
						|
 | 
						|
  if (fields == 0) {
 | 
						|
    // Nothing to write
 | 
						|
    return;
 | 
						|
  }
 | 
						|
 | 
						|
  //
 | 
						|
  // Send data to the worker thread.
 | 
						|
  //
 | 
						|
  delete gWriteData.exchange(
 | 
						|
      telemetryData.release());  // Clear any data that hasn't been written yet
 | 
						|
 | 
						|
  // In case the worker thread was sleeping, wake it up.
 | 
						|
  PR_EnterMonitor(gWriteReady);
 | 
						|
  PR_Notify(gWriteReady);
 | 
						|
  PR_ExitMonitor(gWriteReady);
 | 
						|
}
 | 
						|
 | 
						|
void nsTerminator::UpdateCrashReport(const char* aTopic) {
 | 
						|
  // In case of crash, we wish to know where in shutdown we are
 | 
						|
  nsAutoCString report(aTopic);
 | 
						|
 | 
						|
  Unused << CrashReporter::AnnotateCrashReport(
 | 
						|
      CrashReporter::Annotation::ShutdownProgress, report);
 | 
						|
}
 | 
						|
 | 
						|
void XPCOMShutdownNotified() {
 | 
						|
  MOZ_DIAGNOSTIC_ASSERT(sShutdownNotified == false);
 | 
						|
  sShutdownNotified = true;
 | 
						|
}
 | 
						|
 | 
						|
}  // namespace mozilla
 |