/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ /* vim: set ts=8 sts=2 et sw=2 tw=80: */ // Copyright (c) 2006-2011 The Chromium Authors. All rights reserved. // // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions // are met: // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above copyright // notice, this list of conditions and the following disclaimer in // the documentation and/or other materials provided with the // distribution. // * Neither the name of Google, Inc. nor the names of its contributors // may be used to endorse or promote products derived from this // software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS // FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE // COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, // INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, // BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS // OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED // AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, // OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT // OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF // SUCH DAMAGE. #include #include #include #include "nsWindowsDllInterceptor.h" #include "mozilla/StackWalk_windows.h" #include "mozilla/WindowsVersion.h" namespace mozilla { namespace baseprofiler { static int64_t MicrosecondsSince1970() { int64_t prt; FILETIME ft; SYSTEMTIME st; GetSystemTime(&st); SystemTimeToFileTime(&st, &ft); static_assert(sizeof(ft) == sizeof(prt), "Expect FILETIME to be 64 bits"); memcpy(&prt, &ft, sizeof(prt)); const int64_t epochBias = 116444736000000000LL; prt = (prt - epochBias) / 10; return prt; } void* GetStackTop(void* aGuess) { PNT_TIB pTib = reinterpret_cast(NtCurrentTeb()); return reinterpret_cast(pTib->StackBase); } static void PopulateRegsFromContext(Registers& aRegs, CONTEXT* aContext) { #if defined(GP_ARCH_amd64) aRegs.mPC = reinterpret_cast
(aContext->Rip); aRegs.mSP = reinterpret_cast
(aContext->Rsp); aRegs.mFP = reinterpret_cast
(aContext->Rbp); aRegs.mLR = 0; #elif defined(GP_ARCH_x86) aRegs.mPC = reinterpret_cast
(aContext->Eip); aRegs.mSP = reinterpret_cast
(aContext->Esp); aRegs.mFP = reinterpret_cast
(aContext->Ebp); aRegs.mLR = 0; #elif defined(GP_ARCH_arm64) aRegs.mPC = reinterpret_cast
(aContext->Pc); aRegs.mSP = reinterpret_cast
(aContext->Sp); aRegs.mFP = reinterpret_cast
(aContext->Fp); aRegs.mLR = reinterpret_cast
(aContext->Lr); #else # error "bad arch" #endif } // Gets a real (i.e. not pseudo) handle for the current thread, with the // permissions needed for profiling. // @return a real HANDLE for the current thread. static HANDLE GetRealCurrentThreadHandleForProfiling() { HANDLE realCurrentThreadHandle; if (!::DuplicateHandle( ::GetCurrentProcess(), ::GetCurrentThread(), ::GetCurrentProcess(), &realCurrentThreadHandle, THREAD_GET_CONTEXT | THREAD_SUSPEND_RESUME | THREAD_QUERY_INFORMATION, FALSE, 0)) { return nullptr; } return realCurrentThreadHandle; } class PlatformData { public: // Get a handle to the calling thread. This is the thread that we are // going to profile. We need a real handle because we are going to use it in // the sampler thread. explicit PlatformData(BaseProfilerThreadId aThreadId) : mProfiledThread(GetRealCurrentThreadHandleForProfiling()) { MOZ_ASSERT(DWORD(aThreadId.ToNumber()) == ::GetCurrentThreadId()); } ~PlatformData() { if (mProfiledThread != nullptr) { CloseHandle(mProfiledThread); mProfiledThread = nullptr; } } HANDLE ProfiledThread() { return mProfiledThread; } private: HANDLE mProfiledThread; }; #if defined(USE_MOZ_STACK_WALK) HANDLE GetThreadHandle(PlatformData* aData) { return aData->ProfiledThread(); } #endif static const HANDLE kNoThread = INVALID_HANDLE_VALUE; //////////////////////////////////////////////////////////////////////// // BEGIN Sampler target specifics Sampler::Sampler(PSLockRef aLock) {} void Sampler::Disable(PSLockRef aLock) {} template void Sampler::SuspendAndSampleAndResumeThread( PSLockRef aLock, const RegisteredThread& aRegisteredThread, const TimeStamp& aNow, const Func& aProcessRegs) { HANDLE profiled_thread = aRegisteredThread.GetPlatformData()->ProfiledThread(); if (profiled_thread == nullptr) { return; } // Context used for sampling the register state of the profiled thread. CONTEXT context; memset(&context, 0, sizeof(context)); //----------------------------------------------------------------// // Suspend the samplee thread and get its context. static const DWORD kSuspendFailed = static_cast(-1); if (SuspendThread(profiled_thread) == kSuspendFailed) { return; } // SuspendThread is asynchronous, so the thread may still be running. // Call GetThreadContext first to ensure the thread is really suspended. // See https://blogs.msdn.microsoft.com/oldnewthing/20150205-00/?p=44743. // Using only CONTEXT_CONTROL is faster but on 64-bit it causes crashes in // RtlVirtualUnwind (see bug 1120126) so we set all the flags. #if defined(GP_ARCH_amd64) context.ContextFlags = CONTEXT_FULL; #else context.ContextFlags = CONTEXT_CONTROL; #endif if (!GetThreadContext(profiled_thread, &context)) { ResumeThread(profiled_thread); return; } //----------------------------------------------------------------// // Sample the target thread. // WARNING WARNING WARNING WARNING WARNING WARNING WARNING WARNING // // The profiler's "critical section" begins here. We must be very careful // what we do here, or risk deadlock. See the corresponding comment in // platform-linux-android.cpp for details. Registers regs; PopulateRegsFromContext(regs, &context); aProcessRegs(regs, aNow); //----------------------------------------------------------------// // Resume the target thread. ResumeThread(profiled_thread); // The profiler's critical section ends here. // // WARNING WARNING WARNING WARNING WARNING WARNING WARNING WARNING } // END Sampler target specifics //////////////////////////////////////////////////////////////////////// //////////////////////////////////////////////////////////////////////// // BEGIN SamplerThread target specifics static unsigned int __stdcall ThreadEntry(void* aArg) { auto thread = static_cast(aArg); thread->Run(); return 0; } SamplerThread::SamplerThread(PSLockRef aLock, uint32_t aActivityGeneration, double aIntervalMilliseconds, uint32_t aFeatures) : mSampler(aLock), mActivityGeneration(aActivityGeneration), mIntervalMicroseconds( std::max(1, int(floor(aIntervalMilliseconds * 1000 + 0.5)))), mNoTimerResolutionChange( ProfilerFeature::HasNoTimerResolutionChange(aFeatures)) { if ((!mNoTimerResolutionChange) && (mIntervalMicroseconds < 10 * 1000)) { // By default the timer resolution (which tends to be 1/64Hz, around 16ms) // is not changed. However, if the requested interval is sufficiently low, // the resolution will be adjusted to match. Note that this affects all // timers in Firefox, and could therefore hide issues while profiling. This // change may be prevented with the "notimerresolutionchange" feature. ::timeBeginPeriod(mIntervalMicroseconds / 1000); } // Create a new thread. It is important to use _beginthreadex() instead of // the Win32 function CreateThread(), because the CreateThread() does not // initialize thread-specific structures in the C runtime library. mThread = reinterpret_cast(_beginthreadex(nullptr, /* stack_size */ 0, ThreadEntry, this, /* initflag */ 0, nullptr)); if (mThread == 0) { MOZ_CRASH("_beginthreadex failed"); } } SamplerThread::~SamplerThread() { WaitForSingleObject(mThread, INFINITE); // Close our own handle for the thread. if (mThread != kNoThread) { CloseHandle(mThread); } } void SamplerThread::SleepMicro(uint32_t aMicroseconds) { // For now, keep the old behaviour of minimum Sleep(1), even for // smaller-than-usual sleeps after an overshoot, unless the user has // explicitly opted into a sub-millisecond profiler interval. if (mIntervalMicroseconds >= 1000) { ::Sleep(std::max(1u, aMicroseconds / 1000)); } else { TimeStamp start = TimeStamp::Now(); TimeStamp end = start + TimeDuration::FromMicroseconds(aMicroseconds); // First, sleep for as many whole milliseconds as possible. if (aMicroseconds >= 1000) { ::Sleep(aMicroseconds / 1000); } // Then, spin until enough time has passed. while (TimeStamp::Now() < end) { YieldProcessor(); } } } void SamplerThread::Stop(PSLockRef aLock) { if ((!mNoTimerResolutionChange) && (mIntervalMicroseconds < 10 * 1000)) { // Disable any timer resolution changes we've made. Do it now while // gPSMutex is locked, i.e. before any other SamplerThread can be created // and call ::timeBeginPeriod(). // // It's safe to do this now even though this SamplerThread is still alive, // because the next time the main loop of Run() iterates it won't get past // the mActivityGeneration check, and so it won't make any more ::Sleep() // calls. ::timeEndPeriod(mIntervalMicroseconds / 1000); } mSampler.Disable(aLock); } // END SamplerThread target specifics //////////////////////////////////////////////////////////////////////// static void PlatformInit(PSLockRef aLock) {} #if defined(HAVE_NATIVE_UNWIND) # define REGISTERS_SYNC_POPULATE(regs) \ CONTEXT context; \ RtlCaptureContext(&context); \ PopulateRegsFromContext(regs, &context); #endif #if defined(GP_PLAT_amd64_windows) static WindowsDllInterceptor NtDllIntercept; typedef NTSTATUS(NTAPI* LdrUnloadDll_func)(HMODULE module); static WindowsDllInterceptor::FuncHookType stub_LdrUnloadDll; static NTSTATUS NTAPI patched_LdrUnloadDll(HMODULE module) { // Prevent the stack walker from suspending this thread when LdrUnloadDll // holds the RtlLookupFunctionEntry lock. AutoSuppressStackWalking suppress; return stub_LdrUnloadDll(module); } // These pointers are disguised as PVOID to avoid pulling in obscure headers typedef PVOID(WINAPI* LdrResolveDelayLoadedAPI_func)( PVOID ParentModuleBase, PVOID DelayloadDescriptor, PVOID FailureDllHook, PVOID FailureSystemHook, PVOID ThunkAddress, ULONG Flags); static WindowsDllInterceptor::FuncHookType stub_LdrResolveDelayLoadedAPI; static PVOID WINAPI patched_LdrResolveDelayLoadedAPI( PVOID ParentModuleBase, PVOID DelayloadDescriptor, PVOID FailureDllHook, PVOID FailureSystemHook, PVOID ThunkAddress, ULONG Flags) { // Prevent the stack walker from suspending this thread when // LdrResolveDelayLoadAPI holds the RtlLookupFunctionEntry lock. AutoSuppressStackWalking suppress; return stub_LdrResolveDelayLoadedAPI(ParentModuleBase, DelayloadDescriptor, FailureDllHook, FailureSystemHook, ThunkAddress, Flags); } MFBT_API void InitializeWin64ProfilerHooks() { // This function could be called by both profilers, but we only want to run // it once. static bool ran = false; if (ran) { return; } ran = true; NtDllIntercept.Init("ntdll.dll"); stub_LdrUnloadDll.Set(NtDllIntercept, "LdrUnloadDll", &patched_LdrUnloadDll); if (IsWin8OrLater()) { // LdrResolveDelayLoadedAPI was introduced in Win8 stub_LdrResolveDelayLoadedAPI.Set(NtDllIntercept, "LdrResolveDelayLoadedAPI", &patched_LdrResolveDelayLoadedAPI); } } #endif // defined(GP_PLAT_amd64_windows) } // namespace baseprofiler } // namespace mozilla