/* $Id: tstPrfRT.cpp 62571 2016-07-26 15:58:26Z vboxsync $ */ /** @file * IPRT testcase - profile some of the important functions. */ /* * Copyright (C) 2006-2016 Oracle Corporation * * This file is part of VirtualBox Open Source Edition (OSE), as * available from http://www.virtualbox.org. This file is free software; * you can redistribute it and/or modify it under the terms of the GNU * General Public License (GPL) as published by the Free Software * Foundation, in version 2 as it comes in the "COPYING" file of the * VirtualBox OSE distribution. VirtualBox OSE is distributed in the * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind. * * The contents of this file may alternatively be used under the terms * of the Common Development and Distribution License Version 1.0 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the * VirtualBox OSE distribution, in which case the provisions of the * CDDL are applicable instead of those of the GPL. * * You may elect to license modified versions of this file under the * terms and conditions of either the GPL or the CDDL or both. */ /********************************************************************************************************************************* * Header Files * *********************************************************************************************************************************/ #include #include #include #include #include #if defined(RT_ARCH_AMD64) || defined(RT_ARCH_X86) # include #endif /********************************************************************************************************************************* * Internal Functions * *********************************************************************************************************************************/ #if defined(RT_ARCH_AMD64) || defined(RT_ARCH_X86) DECLASM(void) tstRTPRfAMemoryAccess(void); DECLASM(void) tstRTPRfARegisterAccess(void); DECLASM(void) tstRTPRfAMemoryUnalignedAccess(void); #endif /********************************************************************************************************************************* * Global Variables * *********************************************************************************************************************************/ static RTTEST g_hTest; #if defined(RT_ARCH_AMD64) || defined(RT_ARCH_X86) void PrintResult(uint64_t u64Ticks, uint64_t u64MaxTicks, uint64_t u64MinTicks, unsigned cTimes, const char *pszOperation) { //RTTestPrintf(g_hTest, RTTESTLVL_ALWAYS, // "%-32s %5lld / %5lld / %5lld ticks per call (%u calls %lld ticks)\n", // pszOperation, u64MinTicks, u64Ticks / (uint64_t)cTimes, u64MaxTicks, cTimes, u64Ticks); //RTTestValueF(g_hTest, u64MinTicks, RTTESTUNIT_NONE, "%s min ticks", pszOperation); RTTestValueF(g_hTest, u64Ticks / (uint64_t)cTimes, RTTESTUNIT_NONE, "%s avg ticks", pszOperation); //RTTestValueF(g_hTest, u64MaxTicks, RTTESTUNIT_NONE, "%s max ticks", pszOperation); RT_NOREF_PV(u64MaxTicks); RT_NOREF_PV(u64MinTicks); } # define ITERATE(preexpr, expr, postexpr, cIterations) \ AssertCompile(((cIterations) % 8) == 0); \ /* Min and max value. */ \ for (i = 0, u64MinTS = ~0, u64MaxTS = 0; i < (cIterations); i++) \ { \ { preexpr } \ uint64_t u64StartTS = ASMReadTSC(); \ { expr } \ uint64_t u64ElapsedTS = ASMReadTSC() - u64StartTS; \ { postexpr } \ if (u64ElapsedTS > u64MinTS * 32) \ { \ i--; \ continue; \ } \ if (u64ElapsedTS < u64MinTS) \ u64MinTS = u64ElapsedTS; \ if (u64ElapsedTS > u64MaxTS) \ u64MaxTS = u64ElapsedTS; \ } \ { \ /* Calculate a good average value (may be smaller than min). */ \ i = (cIterations); \ AssertRelease((i % 8) == 0); \ { preexpr } \ uint64_t u64StartTS = ASMReadTSC(); \ while (i != 0) \ { \ { expr } \ { expr } \ { expr } \ { expr } \ { expr } \ { expr } \ { expr } \ { expr } \ i -= 8; \ } \ u64TotalTS = ASMReadTSC() - u64StartTS; \ { postexpr } \ i = (cIterations); \ } #else /* !AMD64 && !X86 */ void PrintResult(uint64_t cNs, uint64_t cNsMax, uint64_t cNsMin, unsigned cTimes, const char *pszOperation) { //RTTestPrintf(g_hTest, RTTESTLVL_ALWAYS, // "%-32s %5lld / %5lld / %5lld ns per call (%u calls %lld ns)\n", // pszOperation, cNsMin, cNs / (uint64_t)cTimes, cNsMax, cTimes, cNs); //RTTestValueF(g_hTest, cNsMin, RTTESTUNIT_NS_PER_CALL, "%s min", pszOperation); RTTestValueF(g_hTest, cNs / (uint64_t)cTimes, RTTESTUNIT_NS_PER_CALL, "%s avg", pszOperation); //RTTestValueF(g_hTest, cNsMax, RTTESTUNIT_NS_PER_CALL, "%s max", pszOperation); } # define ITERATE(preexpr, expr, postexpr, cIterations) \ for (i = 0, u64TotalTS = 0, u64MinTS = ~0, u64MaxTS = 0; i < (cIterations); i++) \ { \ { preexpr } \ uint64_t u64StartTS = RTTimeNanoTS(); \ { expr } \ uint64_t u64ElapsedTS = RTTimeNanoTS() - u64StartTS; \ { postexpr } \ if (u64ElapsedTS > u64MinTS * 32) \ { \ i--; \ continue; \ } \ if (u64ElapsedTS < u64MinTS) \ u64MinTS = u64ElapsedTS; \ if (u64ElapsedTS > u64MaxTS) \ u64MaxTS = u64ElapsedTS; \ u64TotalTS += u64ElapsedTS; \ } #endif /* !AMD64 && !X86 */ int main(int argc, char **argv) { uint64_t u64TotalTS; uint64_t u64MinTS; uint64_t u64MaxTS; unsigned i; RTEXITCODE rcExit = RTTestInitExAndCreate(argc, &argv, argc == 2 ? RTR3INIT_FLAGS_SUPLIB : 0, "tstRTPrf", &g_hTest); if (rcExit != RTEXITCODE_SUCCESS) return rcExit; RTTestBanner(g_hTest); /* * RTTimeNanoTS, RTTimeProgramNanoTS, RTTimeMilliTS, and RTTimeProgramMilliTS. */ ITERATE(RT_NOTHING, RTTimeNanoTS();, RT_NOTHING, _1M * 32); PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "RTTimeNanoTS"); ITERATE(RT_NOTHING, RTTimeProgramNanoTS();, RT_NOTHING, 1000000); PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "RTTimeProgramNanoTS"); ITERATE(RT_NOTHING, RTTimeMilliTS();, RT_NOTHING, 1000000); PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "RTTimeMilliTS"); ITERATE(RT_NOTHING, RTTimeProgramMilliTS();, RT_NOTHING, 1000000); PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "RTTimeProgramMilliTS"); /* * RTTimeNow */ RTTIMESPEC Time; ITERATE(RT_NOTHING, RTTimeNow(&Time);, RT_NOTHING, 1000000); PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "RTTimeNow"); /* * RTLogDefaultInstance() */ ITERATE(RT_NOTHING, RTLogDefaultInstance();, RT_NOTHING, 1000000); PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "RTLogDefaultInstance"); /* * RTThreadSelf and RTThreadNativeSelf */ ITERATE(RT_NOTHING, RTThreadSelf();, RT_NOTHING, 1000000); PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "RTThreadSelf"); ITERATE(RT_NOTHING, RTThreadNativeSelf();, RT_NOTHING, 1000000); PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "RTThreadNativeSelf"); #if defined(RT_ARCH_X86) || defined(RT_ARCH_AMD64) /* * Registers vs stack. */ ITERATE(RT_NOTHING, tstRTPRfARegisterAccess();, RT_NOTHING, 1000); uint64_t const cRegTotal = u64TotalTS; //PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "Register only algorithm"); ITERATE(RT_NOTHING, tstRTPRfAMemoryAccess();, RT_NOTHING, 1000); uint64_t const cMemTotal = u64TotalTS; //PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "Memory only algorithm"); ITERATE(RT_NOTHING, tstRTPRfAMemoryUnalignedAccess();, RT_NOTHING, 1000); uint64_t const cMemUnalignedTotal = u64TotalTS; //PrintResult(u64TotalTS, u64MaxTS, u64MinTS, i, "Memory only algorithm"); uint64_t const cSlower100 = cMemTotal * 100 / cRegTotal; RTTestValue(g_hTest, "Memory instead of registers slowdown", cSlower100, RTTESTUNIT_PCT); uint64_t const cUnalignedSlower100 = cMemUnalignedTotal * 100 / cRegTotal; RTTestValue(g_hTest, "Unaligned memory instead of registers slowdown", cUnalignedSlower100, RTTESTUNIT_PCT); #endif return RTTestSummaryAndDestroy(g_hTest); }