/* Copyright (c) 2009-2012, Intel Corporation All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. * Neither the name of Intel Corporation nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ /* ** Written by Otto Bruggeman, Roman Dementiev */ #pragma once #pragma unmanaged #include "..\PCM-Lib_Win\pcm-lib.h" #include "..\PCM_Win\windriver.h" #include #pragma managed using namespace pcm; using namespace System; using namespace System::Collections; using namespace System::ServiceProcess; using namespace System::ComponentModel; using namespace System::Diagnostics; using namespace System::Threading; using namespace System::Runtime::InteropServices; namespace PCMServiceNS { ref struct Globals { static initonly String^ ServiceName = gcnew String(L"PCMService"); }; ref struct CollectionInformation { CollectionInformation() { core = true; socket = true; qpi = true; } CollectionInformation(const CollectionInformation^ ©able) { core = copyable->core; socket = copyable->socket; qpi = copyable->qpi; } bool core; bool socket; bool qpi; }; ref class MeasureThread { public: MeasureThread(System::Diagnostics::EventLog^ log, int sampleRate, CollectionInformation^ collectionInformation) : log_(log), sampleRate_(sampleRate), collectionInformation_(collectionInformation) { // Get a Monitor instance which sets up the PMU, it also figures out the number of cores and sockets which we need later on to create the performance counters m_ = PCM::getInstance(); if ( !m_->good() ) { log_->WriteEntry(Globals::ServiceName, "Monitor Instance could not be created.", EventLogEntryType::Error); m_->cleanup(); String^ s = gcnew String(m_->getErrorMessage().c_str()); throw gcnew Exception(s); } log_->WriteEntry(Globals::ServiceName, "PCM: Number of cores detected: " + UInt32(m_->getNumCores()).ToString()); m_->program(); log_->WriteEntry(Globals::ServiceName, "PMU Programmed."); // This here will only create the necessary registry entries, the actual counters are created later. // New unified category if (PerformanceCounterCategory::Exists(CountersCore)) { PerformanceCounterCategory::Delete(CountersCore); } if (PerformanceCounterCategory::Exists(CountersSocket)) { PerformanceCounterCategory::Delete(CountersSocket); } if (PerformanceCounterCategory::Exists(CountersQpi)) { PerformanceCounterCategory::Delete(CountersQpi); } log_->WriteEntry(Globals::ServiceName, "Old categories deleted."); // First create the collection, then add counters to it so we add them all at once CounterCreationDataCollection^ counterCollection = gcnew CounterCreationDataCollection; // Here we add the counters one by one, need list of counters currently collected. // This is a stub: copy and paste when new counters are added to ipcustat "library". // CounterCreationData^ counter = gcnew CounterCreationData( "counter", "helptext for counter", PerformanceCounterType::NumberOfItems64 ); // counterCollection->Add( counter ); CounterCreationData^ counter; if (collectionInformation_->core) { counter = gcnew CounterCreationData(MetricCoreClocktick, "Displays the number of clockticks elapsed since previous measurement.", PerformanceCounterType::CounterDelta64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreRetired, "Displays the number of instructions retired since previous measurement.", PerformanceCounterType::CounterDelta64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreMissL2, "Displays the L2 Cache Misses caused by this core.", PerformanceCounterType::CounterDelta64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreMissL3, "Displays the L3 Cache Misses caused by this core.", PerformanceCounterType::CounterDelta64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreIpc, "Displays the instructions per clocktick executed for this core.", PerformanceCounterType::AverageCount64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreBaseIpc, "Not visible", PerformanceCounterType::AverageBase); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreFreqRel, "Displays the current frequency of the core to its rated frequency in percent.", PerformanceCounterType::SampleFraction); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreFreqNom, "Not visible", PerformanceCounterType::SampleBase); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreHeadroom, "Displays temperature reading in 1 degree Celsius relative to the TjMax temperature. 0 corresponds to the max temperature.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreResC0, "Displays the residency of core or socket in core C0-state in percent.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreResC3, "Displays the residency of core or socket in core C3-state in percent.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreResC6, "Displays the residency of core or socket in core C6-state in percent.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricCoreResC7, "Displays the residency of core or socket in core C7-state in percent.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); PerformanceCounterCategory::Create(CountersCore, "Processor Counter Monitor", PerformanceCounterCategoryType::MultiInstance, counterCollection); } if (collectionInformation_->socket) { counterCollection->Clear(); counter = gcnew CounterCreationData(MetricSocketBandRead, "Displays the memory read bandwidth in bytes/s of this socket.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricSocketBandWrite, "Displays the memory write bandwidth in bytes/s of this socket.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricSocketEnergyPack, "Displays the energy in Joules consumed by this socket.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricSocketEnergyDram, "Displays the energy in Joules consumed by DRAM memory attached to the memory controller of this socket.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricSocketResC2, "Displays the residency of socket in package C2-state in percent.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricSocketResC3, "Displays the residency of socket in package C3-state in percent.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricSocketResC6, "Displays the residency of socket in package C6-state in percent.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); counter = gcnew CounterCreationData(MetricSocketResC7, "Displays the residency of socket in package C7-state in percent.", PerformanceCounterType::NumberOfItems64); counterCollection->Add( counter ); PerformanceCounterCategory::Create(CountersSocket, "Processor Counter Monitor", PerformanceCounterCategoryType::MultiInstance, counterCollection); } if (collectionInformation_->qpi) { counterCollection->Clear(); counter = gcnew CounterCreationData(MetricQpiBand, "Displays the incoming bandwidth in bytes/s of this QPI link.", PerformanceCounterType::CounterDelta64); counterCollection->Add( counter ); PerformanceCounterCategory::Create(CountersQpi, "Processor Counter Monitor", PerformanceCounterCategoryType::MultiInstance, counterCollection); } log_->WriteEntry(Globals::ServiceName, "New categories added."); // Registry entries created, now we need to create the programmatic counters. For some things you may want one instance for every core/thread/socket/qpilink so create in a loop. // PerformanceCounter^ pc1 = gcnew PerformanceCounter( "SomeCounterName", "nameOfCounterAsEnteredInTheRegistry", "instanceNameOfCounterAsANumber" ); // Create #processors instances of the core specific performance counters String^ s; // Used for creating the instance name and the string to search for in the hashtable for ( unsigned int i = 0; i < m_->getNumCores(); ++i ) { s = UInt32(i).ToString(); // For core counters we use just the number of the core if (collectionInformation_->core) { ticksHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreClocktick, s, false)); instRetHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreRetired, s, false)); l2CacheMissHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreMissL2, s, false)); l3CacheMissHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreMissL3, s, false)); ipcHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreIpc, s, false)); baseTicksForIpcHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreBaseIpc, s, false)); relFreqHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreFreqRel, s, false)); baseTicksForRelFreqHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreFreqNom, s, false)); thermalHeadroomHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreHeadroom, s, false)); CoreC0StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC0, s, false)); CoreC3StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC3, s, false)); CoreC6StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC6, s, false)); CoreC7StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC7, s, false)); } } // Create socket instances of the common core counters, names are Socket+number for ( unsigned int i=0; igetNumSockets(); ++i ) { s = "Socket"+UInt32(i).ToString(); if (collectionInformation_->core) { ticksHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreClocktick, s, false)); instRetHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreRetired, s, false)); l2CacheMissHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreMissL2, s, false)); l3CacheMissHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreMissL3, s, false)); ipcHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreIpc, s, false)); baseTicksForIpcHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreBaseIpc, s, false)); relFreqHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreFreqRel, s, false)); baseTicksForRelFreqHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreFreqNom, s, false)); thermalHeadroomHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreHeadroom, s, false)); CoreC0StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC0, s, false)); CoreC3StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC3, s, false)); CoreC6StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC6, s, false)); CoreC7StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC7, s, false)); } if (collectionInformation_->socket) { mrbHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketBandRead, s, false)); mwbHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketBandWrite, s, false)); packageEnergyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketEnergyPack, s, false)); DRAMEnergyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketEnergyDram, s, false)); PackageC2StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketResC2, s, false)); PackageC3StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketResC3, s, false)); PackageC6StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketResC6, s, false)); PackageC7StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketResC7, s, false)); } if (collectionInformation_->qpi) { qpiHash_.Add(s, gcnew PerformanceCounter(CountersQpi, MetricQpiBand, s, false)); // Socket aggregate String^ t; for ( unsigned int j=0; jgetQPILinksPerSocket(); ++j ) { t = s + "_Link" + UInt32(j).ToString(); qpiHash_.Add(t, gcnew PerformanceCounter(CountersQpi, MetricQpiBand, t, false)); } } } // Create #system instances of the system specific performance counters, just kidding, there is only one system so 1 instance s = "Total_"; if (collectionInformation_->core) { ticksHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreClocktick, s, false)); instRetHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreRetired, s, false)); l2CacheMissHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreMissL2, s, false)); l3CacheMissHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreMissL3, s, false)); ipcHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreIpc, s, false)); baseTicksForIpcHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreBaseIpc, s, false)); relFreqHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreFreqRel, s, false)); baseTicksForRelFreqHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreFreqNom, s, false)); thermalHeadroomHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreHeadroom, s, false)); CoreC0StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC0, s, false)); CoreC3StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC3, s, false)); CoreC6StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC6, s, false)); CoreC7StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersCore, MetricCoreResC7, s, false)); } if (collectionInformation_->socket) { mrbHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketBandRead, s, false)); mwbHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketBandWrite, s, false)); packageEnergyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketEnergyPack, s, false)); DRAMEnergyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketEnergyDram, s, false)); PackageC2StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketResC2, s, false)); PackageC3StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketResC3, s, false)); PackageC6StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketResC6, s, false)); PackageC7StateResidencyHash_.Add(s, gcnew PerformanceCounter(CountersSocket, MetricSocketResC7, s, false)); } if (collectionInformation_->qpi) { qpiHash_.Add(s, gcnew PerformanceCounter(CountersQpi, MetricQpiBand, s, false)); } log_->WriteEntry(Globals::ServiceName, "All instances of the performance counter categories have been created."); } void doMeasurements( void ) { // FIXME: Do we care about hot swappability of CPUs? const size_t numSockets = m_->getNumSockets(); const size_t numCores = m_->getNumCores(); const size_t numQpiLinks = (size_t) m_->getQPILinksPerSocket(); // The structures SystemCounterState oldSystemState; SocketCounterState* oldSocketStates = new SocketCounterState[numSockets]; CoreCounterState* oldCoreStates = new CoreCounterState[numCores]; try { while (true) { Thread::Sleep(sampleRate_); // Fetch counter data here and store in the PerformanceCounter instances SystemCounterState systemState = getSystemCounterState(); // Set system performance counters String^ s = "Total_"; if (collectionInformation_->core) { __int64 totalTicks = getCycles(systemState); __int64 totalRefTicks = m_->getNominalFrequency() * numCores; __int64 totalInstr = getInstructionsRetired(systemState); ((PerformanceCounter^)ticksHash_[s])->RawValue = totalTicks; ((PerformanceCounter^)instRetHash_[s])->RawValue = totalInstr; ((PerformanceCounter^)l2CacheMissHash_[s])->IncrementBy(getL2CacheMisses(oldSystemState, systemState)); ((PerformanceCounter^)l3CacheMissHash_[s])->IncrementBy(getL3CacheMisses(oldSystemState, systemState)); ((PerformanceCounter^)ipcHash_[s])->RawValue = totalInstr >> 17; ((PerformanceCounter^)baseTicksForIpcHash_[s])->RawValue = totalTicks >> 17; ((PerformanceCounter^)relFreqHash_[s])->RawValue = totalTicks >> 17; ((PerformanceCounter^)baseTicksForRelFreqHash_[s])->IncrementBy(totalRefTicks >> 17); ((PerformanceCounter^)thermalHeadroomHash_[s])->RawValue = systemState.getThermalHeadroom(); ((PerformanceCounter^)CoreC0StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(0,oldSystemState, systemState)); ((PerformanceCounter^)CoreC3StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(3,oldSystemState, systemState)); ((PerformanceCounter^)CoreC6StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(6,oldSystemState, systemState)); ((PerformanceCounter^)CoreC7StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(7,oldSystemState, systemState)); //log_->WriteEntry(Globals::ServiceName, "Std: " + UInt64(totalTicks).ToString()); //log_->WriteEntry(Globals::ServiceName, "Ref: " + UInt64(totalRefTicks).ToString()); } if (collectionInformation_->socket) { ((PerformanceCounter^)mrbHash_[s])->RawValue = getBytesReadFromMC(oldSystemState, systemState); ((PerformanceCounter^)mwbHash_[s])->RawValue = getBytesWrittenToMC(oldSystemState, systemState); ((PerformanceCounter^)packageEnergyHash_[s])->RawValue = (__int64)getConsumedJoules(oldSystemState, systemState); ((PerformanceCounter^)DRAMEnergyHash_[s])->RawValue = (__int64)getDRAMConsumedJoules(oldSystemState, systemState); ((PerformanceCounter^)PackageC2StateResidencyHash_[s])->RawValue = __int64(100.*getPackageCStateResidency(2, oldSystemState, systemState)); ((PerformanceCounter^)PackageC3StateResidencyHash_[s])->RawValue = __int64(100.*getPackageCStateResidency(3, oldSystemState, systemState)); ((PerformanceCounter^)PackageC6StateResidencyHash_[s])->RawValue = __int64(100.*getPackageCStateResidency(6, oldSystemState, systemState)); ((PerformanceCounter^)PackageC7StateResidencyHash_[s])->RawValue = __int64(100.*getPackageCStateResidency(7, oldSystemState, systemState)); } if (collectionInformation_->qpi) { ((PerformanceCounter^)qpiHash_[s])->RawValue = getAllIncomingQPILinkBytes(systemState); } // Copy current state to old state oldSystemState = std::move( systemState ); // Set socket performance counters for ( unsigned int i = 0; i < numSockets; ++i ) { s = "Socket"+UInt32(i).ToString(); SocketCounterState socketState = getSocketCounterState(i); if (collectionInformation_->core) { __int64 socketTicks = getCycles(socketState); __int64 socketRefTicks = m_->getNominalFrequency()* numCores / numSockets; __int64 socketInstr = getInstructionsRetired(socketState); ((PerformanceCounter^)instRetHash_[s])->RawValue = socketInstr; ((PerformanceCounter^)ipcHash_[s])->RawValue = socketInstr >> 17; ((PerformanceCounter^)l2CacheMissHash_[s])->IncrementBy(getL2CacheMisses(oldSocketStates[i], socketState)); ((PerformanceCounter^)l3CacheMissHash_[s])->IncrementBy(getL3CacheMisses(oldSocketStates[i], socketState)); ((PerformanceCounter^)ticksHash_[s])->RawValue = socketTicks; ((PerformanceCounter^)baseTicksForIpcHash_[s])->RawValue = socketTicks >> 17; ((PerformanceCounter^)relFreqHash_[s])->RawValue = socketTicks >> 17; ((PerformanceCounter^)baseTicksForRelFreqHash_[s])->IncrementBy(socketRefTicks >> 17); ((PerformanceCounter^)thermalHeadroomHash_[s])->RawValue = socketState.getThermalHeadroom(); ((PerformanceCounter^)CoreC0StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(0, oldSocketStates[i], socketState)); ((PerformanceCounter^)CoreC3StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(3, oldSocketStates[i], socketState)); ((PerformanceCounter^)CoreC6StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(6, oldSocketStates[i], socketState)); ((PerformanceCounter^)CoreC7StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(7, oldSocketStates[i], socketState)); } if (collectionInformation_->socket) { ((PerformanceCounter^)mrbHash_[s])->RawValue = getBytesReadFromMC(oldSocketStates[i], socketState); ((PerformanceCounter^)mwbHash_[s])->RawValue = getBytesWrittenToMC(oldSocketStates[i], socketState); ((PerformanceCounter^)packageEnergyHash_[s])->RawValue = (__int64)getConsumedJoules(oldSocketStates[i], socketState); ((PerformanceCounter^)DRAMEnergyHash_[s])->RawValue = (__int64)getDRAMConsumedJoules(oldSocketStates[i], socketState); ((PerformanceCounter^)PackageC2StateResidencyHash_[s])->RawValue = __int64(100.*getPackageCStateResidency(2,oldSocketStates[i], socketState)); ((PerformanceCounter^)PackageC3StateResidencyHash_[s])->RawValue = __int64(100.*getPackageCStateResidency(3,oldSocketStates[i], socketState)); ((PerformanceCounter^)PackageC6StateResidencyHash_[s])->RawValue = __int64(100.*getPackageCStateResidency(6,oldSocketStates[i], socketState)); ((PerformanceCounter^)PackageC7StateResidencyHash_[s])->RawValue = __int64(100.*getPackageCStateResidency(7,oldSocketStates[i], socketState)); } if (collectionInformation_->qpi) { ((PerformanceCounter^)qpiHash_[s])->RawValue = getSocketIncomingQPILinkBytes(i, systemState); String^ t; // and qpi link counters per socket for ( unsigned int j=0; jRawValue = getIncomingQPILinkBytes(i, j, systemState); } } oldSocketStates[i] = std::move(socketState); } // Set core performance counters for ( unsigned int i = 0; i < numCores; ++i ) { s = UInt32(i).ToString(); CoreCounterState coreState = getCoreCounterState(i); if (collectionInformation_->core) { __int64 ticks = getCycles(coreState); __int64 refTicks = m_->getNominalFrequency(); __int64 instr = getInstructionsRetired(coreState); ((PerformanceCounter^)instRetHash_[s])->RawValue = instr; ((PerformanceCounter^)ipcHash_[s])->RawValue = instr >> 17; ((PerformanceCounter^)l2CacheMissHash_[s])->IncrementBy(getL2CacheMisses(oldCoreStates[i], coreState)); ((PerformanceCounter^)l3CacheMissHash_[s])->IncrementBy(getL3CacheMisses(oldCoreStates[i], coreState)); ((PerformanceCounter^)ticksHash_[s])->RawValue = ticks; ((PerformanceCounter^)baseTicksForIpcHash_[s])->RawValue = ticks >> 17; ((PerformanceCounter^)relFreqHash_[s])->RawValue = ticks >> 17; ((PerformanceCounter^)baseTicksForRelFreqHash_[s])->IncrementBy(refTicks >> 17); ((PerformanceCounter^)thermalHeadroomHash_[s])->RawValue = coreState.getThermalHeadroom(); ((PerformanceCounter^)CoreC0StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(0,oldCoreStates[i], coreState)); ((PerformanceCounter^)CoreC3StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(3,oldCoreStates[i], coreState)); ((PerformanceCounter^)CoreC6StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(6,oldCoreStates[i], coreState)); ((PerformanceCounter^)CoreC7StateResidencyHash_[s])->RawValue = __int64(100.*getCoreCStateResidency(7,oldCoreStates[i], coreState)); } oldCoreStates[i] = std::move(coreState); } } } catch( ThreadAbortException^ ) { // We get here when for instance the service gets stopped or something bad happens. // In order to do our cleanup, like unprogram the MSRs, close the driver and such, in case we get stopped we want to execute normally after this // so this resets the abort and allows a normal exit Thread::ResetAbort(); } // Here we now have the chance to do cleanup after catching the ThreadAbortException because of the ResetAbort m_->cleanup(); delete[] oldSocketStates; delete[] oldCoreStates; } private: // Core counter hashtables System::Collections::Hashtable ticksHash_; System::Collections::Hashtable instRetHash_; System::Collections::Hashtable ipcHash_; System::Collections::Hashtable baseTicksForIpcHash_; System::Collections::Hashtable relFreqHash_; System::Collections::Hashtable baseTicksForRelFreqHash_; System::Collections::Hashtable l3CacheMissHash_; System::Collections::Hashtable l2CacheMissHash_; // Socket counter hashtables System::Collections::Hashtable mrbHash_; System::Collections::Hashtable mwbHash_; // QPI counter hashtables System::Collections::Hashtable qpiHash_; // Energy counters System::Collections::Hashtable packageEnergyHash_; System::Collections::Hashtable DRAMEnergyHash_; // Thermal headroom System::Collections::Hashtable thermalHeadroomHash_; // C-state Residencies System::Collections::Hashtable CoreC0StateResidencyHash_; System::Collections::Hashtable CoreC3StateResidencyHash_; System::Collections::Hashtable CoreC6StateResidencyHash_; System::Collections::Hashtable CoreC7StateResidencyHash_; System::Collections::Hashtable PackageC2StateResidencyHash_; System::Collections::Hashtable PackageC3StateResidencyHash_; System::Collections::Hashtable PackageC6StateResidencyHash_; System::Collections::Hashtable PackageC7StateResidencyHash_; System::Diagnostics::EventLog^ log_; PCM* m_; // Counter variable names initonly String^ CountersCore = gcnew String(L"PCM Core Counters"); initonly String^ CountersSocket = gcnew String(L"PCM Socket Counters"); initonly String^ CountersQpi = gcnew String(L"PCM QPI Counters"); initonly String^ MetricCoreClocktick = gcnew String(L"Clockticks"); initonly String^ MetricCoreRetired = gcnew String(L"Instructions Retired"); initonly String^ MetricCoreMissL2 = gcnew String(L"L2 Cache Misses"); initonly String^ MetricCoreMissL3 = gcnew String(L"L3 Cache Misses"); initonly String^ MetricCoreIpc = gcnew String(L"Instructions Per Clocktick (IPC)"); initonly String^ MetricCoreBaseIpc = gcnew String(L"Base ticks IPC"); initonly String^ MetricCoreFreqRel = gcnew String(L"Relative Frequency (%)"); initonly String^ MetricCoreFreqNom = gcnew String(L"Nominal Frequency"); initonly String^ MetricCoreHeadroom = gcnew String(L"Thermal Headroom below TjMax"); initonly String^ MetricCoreResC0 = gcnew String(L"core C0-state residency (%)"); initonly String^ MetricCoreResC3 = gcnew String(L"core C3-state residency (%)"); initonly String^ MetricCoreResC6 = gcnew String(L"core C6-state residency (%)"); initonly String^ MetricCoreResC7 = gcnew String(L"core C7-state residency (%)"); initonly String^ MetricSocketBandRead = gcnew String(L"Memory Read Bandwidth"); initonly String^ MetricSocketBandWrite = gcnew String(L"Memory Write Bandwidth"); initonly String^ MetricSocketEnergyPack = gcnew String(L"Package/Socket Consumed Energy"); initonly String^ MetricSocketEnergyDram = gcnew String(L"DRAM/Memory Consumed Energy"); initonly String^ MetricSocketResC2 = gcnew String(L"package C2-state residency (%)"); initonly String^ MetricSocketResC3 = gcnew String(L"package C3-state residency (%)"); initonly String^ MetricSocketResC6 = gcnew String(L"package C6-state residency (%)"); initonly String^ MetricSocketResC7 = gcnew String(L"package C7-state residency (%)"); initonly String^ MetricQpiBand = gcnew String(L"QPI Link Bandwidth"); // Configuration values const int sampleRate_; const CollectionInformation^ collectionInformation_; }; /// /// Summary for PMCService /// /// /// WARNING: If you change the name of this class, you will need to change the /// 'Resource File Name' property for the managed resource compiler tool /// associated with all .resx files this class depends on. Otherwise, /// the designers will not be able to interact properly with localized /// resources associated with this form. public ref class PCMService : public System::ServiceProcess::ServiceBase { [DllImport ("advapi32.dll")] static bool SetServiceStatus (IntPtr hServiceStatus, LPSERVICE_STATUS lpServiceStatus); private: void SetServiceFail (int ErrorCode) { SERVICE_STATUS ServiceStatus_; ServiceStatus_.dwCurrentState = (int)SERVICE_STOPPED; ServiceStatus_.dwServiceType = SERVICE_WIN32_OWN_PROCESS; ServiceStatus_.dwWaitHint = 0; ServiceStatus_.dwWin32ExitCode = ErrorCode; ServiceStatus_.dwServiceSpecificExitCode = 0; ServiceStatus_.dwCheckPoint = 0; ServiceStatus_.dwControlsAccepted = 0 | (this->CanStop ? (int) SERVICE_ACCEPT_STOP : 0) | (this->CanShutdown ? (int) SERVICE_ACCEPT_SHUTDOWN : 0) | (this->CanPauseAndContinue ? (int) SERVICE_ACCEPT_PAUSE_CONTINUE : 0) | (this->CanHandleSessionChangeEvent ? (int) SERVICE_ACCEPT_SESSIONCHANGE : 0) | (this->CanHandlePowerEvent ? (int) SERVICE_ACCEPT_POWEREVENT : 0); SetServiceStatus (this->ServiceHandle, &ServiceStatus_); } public: PCMService() { InitializeComponent(); // //TODO: Add the constructor code here // } protected: /// /// Clean up any resources being used. /// ~PCMService() { if (components) { delete components; } } /// /// Set things in motion so your service can do its work. /// virtual void OnStart(array^ args) override { // Default values for configuration int sampleRate = 1000; CollectionInformation^ collectionInformation = gcnew CollectionInformation(); // Read configuration values from registry HKEY hkey; if (ERROR_SUCCESS == RegOpenKeyEx(HKEY_LOCAL_MACHINE, L"SOFTWARE\\pcm\\service", NULL, KEY_READ, &hkey)) { DWORD regDWORD = static_cast(REG_DWORD); DWORD lenDWORD = 32; DWORD sampleRateRead(0); if (ERROR_SUCCESS == RegQueryValueEx(hkey, L"SampleRate", NULL, NULL, reinterpret_cast(&sampleRateRead), &lenDWORD)) { sampleRate = (int)sampleRateRead; } DWORD collectCoreRead(0); if (ERROR_SUCCESS == RegQueryValueEx(hkey, L"CollectCore", NULL, NULL, reinterpret_cast(&collectCoreRead), &lenDWORD)) { collectionInformation->core = (int)collectCoreRead > 0; } DWORD collectSocketRead(0); if (ERROR_SUCCESS == RegQueryValueEx(hkey, L"CollectSocket", NULL, NULL, reinterpret_cast(&collectSocketRead), &lenDWORD)) { collectionInformation->socket = (int)collectSocketRead > 0; } DWORD collectQpiRead(0); if (ERROR_SUCCESS == RegQueryValueEx(hkey, L"CollectQpi", NULL, NULL, reinterpret_cast(&collectQpiRead), &lenDWORD)) { collectionInformation->qpi = (int)collectQpiRead > 0; } RegCloseKey(hkey); } this->RequestAdditionalTime(4000); // We should open the driver here EventLog->WriteEntry(Globals::ServiceName, "Trying to start the driver...", EventLogEntryType::Information); drv_ = new Driver; if (!drv_->start()) { String^ s = gcnew String((L"Cannot open the driver.\nYou must have a signed driver at " + drv_->driverPath() + L" and have administrator rights to run this program.\n\n").c_str()); EventLog->WriteEntry(Globals::ServiceName, s, EventLogEntryType::Error); SetServiceFail(ERROR_FILE_NOT_FOUND); throw gcnew Exception(s); } // TODO: Add code here to start your service. MeasureThread^ mt; EventLog->WriteEntry(Globals::ServiceName, "Trying to create the measure thread...", EventLogEntryType::Information); try { mt = gcnew MeasureThread(EventLog, sampleRate, collectionInformation); } catch (Exception^ e) { EventLog->WriteEntry(Globals::ServiceName, e->Message, EventLogEntryType::Error); SetServiceFail(0x80886); throw e; } // Create thread, pretty obvious comment here workerThread_ = gcnew Thread( gcnew ThreadStart( mt, &MeasureThread::doMeasurements ) ); // Start timer/thread to read out registers and fill performance counter structures workerThread_->Start(); // EventLog->WriteEntry("PCMService", System::DateTime::Now.ToLongTimeString() + " Monitor could not initialize PMU, aborting.", EventLogEntryType::Error); } /// /// Stop this service. /// virtual void OnStop() override { // TODO: Add code here to perform any tear-down necessary to stop your service. this->RequestAdditionalTime(4000); // Stop timer/thread // doMeasurements will do cleanup itself, might have to do some sanity checks here workerThread_->Abort(); drv_->stop(); } private: /// /// Required designer variable. /// System::ComponentModel::Container ^components; System::Threading::Thread^ workerThread_; Driver* drv_; #pragma region Windows Form Designer generated code /// /// Required method for Designer support - do not modify /// the contents of this method with the code editor. /// void InitializeComponent(void) { // // PCMService // this->CanPauseAndContinue = true; this->ServiceName = Globals::ServiceName; } #pragma endregion }; }