mirror of
https://gitlab.com/libvirt/libvirt.git
synced 2025-01-03 11:35:19 +00:00
perf: add more perf events support
With current perf framework, this patch adds support and documentation for more perf events, including cache misses, cache references, cpu cycles, and instructions. Signed-off-by: Qiaowei Ren <qiaowei.ren@intel.com>
This commit is contained in:
parent
b00d7f298b
commit
bae660869d
@ -1922,6 +1922,10 @@
|
|||||||
<event name='cmt' enabled='yes'/>
|
<event name='cmt' enabled='yes'/>
|
||||||
<event name='mbmt' enabled='no'/>
|
<event name='mbmt' enabled='no'/>
|
||||||
<event name='mbml' enabled='yes'/>
|
<event name='mbml' enabled='yes'/>
|
||||||
|
<event name='cpu_cycles' enabled='no'/>
|
||||||
|
<event name='instructions' enabled='yes'/>
|
||||||
|
<event name='cache_references' enabled='no'/>
|
||||||
|
<event name='cache_misses' enabled='no'/>
|
||||||
</perf>
|
</perf>
|
||||||
...
|
...
|
||||||
</pre>
|
</pre>
|
||||||
@ -1947,6 +1951,26 @@
|
|||||||
<td>bandwidth of memory traffic for a memory controller</td>
|
<td>bandwidth of memory traffic for a memory controller</td>
|
||||||
<td><code>perf.mbml</code></td>
|
<td><code>perf.mbml</code></td>
|
||||||
</tr>
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td><code>cpu_cycles</code></td>
|
||||||
|
<td>the number of cpu cycles one instruction needs</td>
|
||||||
|
<td><code>perf.cpu_cycles</code></td>
|
||||||
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td><code>instructions</code></td>
|
||||||
|
<td>the count of instructions by applications running on the platform</td>
|
||||||
|
<td><code>perf.instructions</code></td>
|
||||||
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td><code>cache_references</code></td>
|
||||||
|
<td>the count of cache hits by applications running on the platform</td>
|
||||||
|
<td><code>perf.cache_references</code></td>
|
||||||
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td><code>cache_misses</code></td>
|
||||||
|
<td>the count of cache misses by applications running on the platform</td>
|
||||||
|
<td><code>perf.cache_misses</code></td>
|
||||||
|
</tr>
|
||||||
</table>
|
</table>
|
||||||
|
|
||||||
<h3><a name="elementsDevices">Devices</a></h3>
|
<h3><a name="elementsDevices">Devices</a></h3>
|
||||||
|
@ -422,6 +422,10 @@
|
|||||||
<value>cmt</value>
|
<value>cmt</value>
|
||||||
<value>mbmt</value>
|
<value>mbmt</value>
|
||||||
<value>mbml</value>
|
<value>mbml</value>
|
||||||
|
<value>cpu_cycles</value>
|
||||||
|
<value>instructions</value>
|
||||||
|
<value>cache_references</value>
|
||||||
|
<value>cache_misses</value>
|
||||||
</choice>
|
</choice>
|
||||||
</attribute>
|
</attribute>
|
||||||
<attribute name="enabled">
|
<attribute name="enabled">
|
||||||
|
@ -1972,6 +1972,45 @@ void virDomainStatsRecordListFree(virDomainStatsRecordPtr *stats);
|
|||||||
*/
|
*/
|
||||||
# define VIR_PERF_PARAM_MBML "mbml"
|
# define VIR_PERF_PARAM_MBML "mbml"
|
||||||
|
|
||||||
|
/**
|
||||||
|
* VIR_PERF_PARAM_CACHE_MISSES:
|
||||||
|
*
|
||||||
|
* Macro for typed parameter name that represents cache_misses perf
|
||||||
|
* event which can be used to measure the count of cache misses by
|
||||||
|
* applications running on the platform. It corresponds to the
|
||||||
|
* "perf.cache_misses" field in the *Stats APIs.
|
||||||
|
*/
|
||||||
|
# define VIR_PERF_PARAM_CACHE_MISSES "cache_misses"
|
||||||
|
|
||||||
|
/**
|
||||||
|
* VIR_PERF_PARAM_CACHE_REFERENCES:
|
||||||
|
*
|
||||||
|
* Macro for typed parameter name that represents cache_references
|
||||||
|
* perf event which can be used to measure the count of cache hits
|
||||||
|
* by applications running on the platform. It corresponds to the
|
||||||
|
* "perf.cache_references" field in the *Stats APIs.
|
||||||
|
*/
|
||||||
|
# define VIR_PERF_PARAM_CACHE_REFERENCES "cache_references"
|
||||||
|
|
||||||
|
/**
|
||||||
|
* VIR_PERF_PARAM_INSTRUCTIONS:
|
||||||
|
*
|
||||||
|
* Macro for typed parameter name that represents instructions perf
|
||||||
|
* event which can be used to measure the count of instructions
|
||||||
|
* by applications running on the platform. It corresponds to the
|
||||||
|
* "perf.instructions" field in the *Stats APIs.
|
||||||
|
*/
|
||||||
|
# define VIR_PERF_PARAM_INSTRUCTIONS "instructions"
|
||||||
|
|
||||||
|
/**
|
||||||
|
* VIR_PERF_PARAM_CPU_CYCLES:
|
||||||
|
*
|
||||||
|
* Macro for typed parameter name that represents cpu_cycles perf event
|
||||||
|
* which can be used to measure how many cpu cycles one instruction needs.
|
||||||
|
* It corresponds to the "perf.cpu_cycles" field in the *Stats APIs.
|
||||||
|
*/
|
||||||
|
# define VIR_PERF_PARAM_CPU_CYCLES "cpu_cycles"
|
||||||
|
|
||||||
int virDomainGetPerfEvents(virDomainPtr dom,
|
int virDomainGetPerfEvents(virDomainPtr dom,
|
||||||
virTypedParameterPtr *params,
|
virTypedParameterPtr *params,
|
||||||
int *nparams,
|
int *nparams,
|
||||||
|
@ -11457,6 +11457,15 @@ virConnectGetDomainCapabilities(virConnectPtr conn,
|
|||||||
* "perf.mbml" - the amount of data (bytes/s) sent through the memory controller
|
* "perf.mbml" - the amount of data (bytes/s) sent through the memory controller
|
||||||
* on the socket as unsigned long long. It is produced by mbml
|
* on the socket as unsigned long long. It is produced by mbml
|
||||||
* perf event.
|
* perf event.
|
||||||
|
* "perf.cache_misses" - the count of cache misses as unsigned long long.
|
||||||
|
* It is produced by cache_misses perf event.
|
||||||
|
* "perf.cache_references" - the count of cache hits as unsigned long long.
|
||||||
|
* It is produced by cache_references perf event.
|
||||||
|
* "perf.instructions" - The count of instructions as unsigned long long.
|
||||||
|
* It is produced by instructions perf event.
|
||||||
|
* "perf.cpu_cycles" - The number of cpu cycles one instruction needs as
|
||||||
|
* unsigned long long. It is produced by cpu_cycles
|
||||||
|
* perf event.
|
||||||
*
|
*
|
||||||
* Note that entire stats groups or individual stat fields may be missing from
|
* Note that entire stats groups or individual stat fields may be missing from
|
||||||
* the output in case they are not supported by the given hypervisor, are not
|
* the output in case they are not supported by the given hypervisor, are not
|
||||||
|
@ -9759,6 +9759,10 @@ qemuDomainSetPerfEvents(virDomainPtr dom,
|
|||||||
VIR_PERF_PARAM_CMT, VIR_TYPED_PARAM_BOOLEAN,
|
VIR_PERF_PARAM_CMT, VIR_TYPED_PARAM_BOOLEAN,
|
||||||
VIR_PERF_PARAM_MBMT, VIR_TYPED_PARAM_BOOLEAN,
|
VIR_PERF_PARAM_MBMT, VIR_TYPED_PARAM_BOOLEAN,
|
||||||
VIR_PERF_PARAM_MBML, VIR_TYPED_PARAM_BOOLEAN,
|
VIR_PERF_PARAM_MBML, VIR_TYPED_PARAM_BOOLEAN,
|
||||||
|
VIR_PERF_PARAM_CPU_CYCLES, VIR_TYPED_PARAM_BOOLEAN,
|
||||||
|
VIR_PERF_PARAM_INSTRUCTIONS, VIR_TYPED_PARAM_BOOLEAN,
|
||||||
|
VIR_PERF_PARAM_CACHE_REFERENCES, VIR_TYPED_PARAM_BOOLEAN,
|
||||||
|
VIR_PERF_PARAM_CACHE_MISSES, VIR_TYPED_PARAM_BOOLEAN,
|
||||||
NULL) < 0)
|
NULL) < 0)
|
||||||
return -1;
|
return -1;
|
||||||
|
|
||||||
|
@ -38,7 +38,9 @@ VIR_LOG_INIT("util.perf");
|
|||||||
#define VIR_FROM_THIS VIR_FROM_PERF
|
#define VIR_FROM_THIS VIR_FROM_PERF
|
||||||
|
|
||||||
VIR_ENUM_IMPL(virPerfEvent, VIR_PERF_EVENT_LAST,
|
VIR_ENUM_IMPL(virPerfEvent, VIR_PERF_EVENT_LAST,
|
||||||
"cmt", "mbmt", "mbml");
|
"cmt", "mbmt", "mbml",
|
||||||
|
"cpu_cycles", "instructions",
|
||||||
|
"cache_references", "cache_misses");
|
||||||
|
|
||||||
struct virPerfEvent {
|
struct virPerfEvent {
|
||||||
int type;
|
int type;
|
||||||
@ -71,6 +73,18 @@ static struct virPerfEventAttr attrs[] = {
|
|||||||
{.type = VIR_PERF_EVENT_CMT, .attrType = 0, .attrConfig = 1},
|
{.type = VIR_PERF_EVENT_CMT, .attrType = 0, .attrConfig = 1},
|
||||||
{.type = VIR_PERF_EVENT_MBMT, .attrType = 0, .attrConfig = 2},
|
{.type = VIR_PERF_EVENT_MBMT, .attrType = 0, .attrConfig = 2},
|
||||||
{.type = VIR_PERF_EVENT_MBML, .attrType = 0, .attrConfig = 3},
|
{.type = VIR_PERF_EVENT_MBML, .attrType = 0, .attrConfig = 3},
|
||||||
|
{.type = VIR_PERF_EVENT_CPU_CYCLES,
|
||||||
|
.attrType = PERF_TYPE_HARDWARE,
|
||||||
|
.attrConfig = PERF_COUNT_HW_CPU_CYCLES},
|
||||||
|
{.type = VIR_PERF_EVENT_INSTRUCTIONS,
|
||||||
|
.attrType = PERF_TYPE_HARDWARE,
|
||||||
|
.attrConfig = PERF_COUNT_HW_INSTRUCTIONS},
|
||||||
|
{.type = VIR_PERF_EVENT_CACHE_REFERENCES,
|
||||||
|
.attrType = PERF_TYPE_HARDWARE,
|
||||||
|
.attrConfig = PERF_COUNT_HW_CACHE_REFERENCES},
|
||||||
|
{.type = VIR_PERF_EVENT_CACHE_MISSES,
|
||||||
|
.attrType = PERF_TYPE_HARDWARE,
|
||||||
|
.attrConfig = PERF_COUNT_HW_CACHE_MISSES},
|
||||||
};
|
};
|
||||||
typedef struct virPerfEventAttr *virPerfEventAttrPtr;
|
typedef struct virPerfEventAttr *virPerfEventAttrPtr;
|
||||||
|
|
||||||
|
@ -32,6 +32,11 @@ typedef enum {
|
|||||||
VIR_PERF_EVENT_MBMT, /* Memory Bandwidth Monitoring Total */
|
VIR_PERF_EVENT_MBMT, /* Memory Bandwidth Monitoring Total */
|
||||||
VIR_PERF_EVENT_MBML, /* Memory Bandwidth Monitor Limit for controller */
|
VIR_PERF_EVENT_MBML, /* Memory Bandwidth Monitor Limit for controller */
|
||||||
|
|
||||||
|
VIR_PERF_EVENT_CPU_CYCLES, /* CPU Cycles per instruction */
|
||||||
|
VIR_PERF_EVENT_INSTRUCTIONS, /* Count of instructions for application */
|
||||||
|
VIR_PERF_EVENT_CACHE_REFERENCES, /* Cache hits by applications */
|
||||||
|
VIR_PERF_EVENT_CACHE_MISSES, /* Cache misses by applications */
|
||||||
|
|
||||||
VIR_PERF_EVENT_LAST
|
VIR_PERF_EVENT_LAST
|
||||||
} virPerfEventType;
|
} virPerfEventType;
|
||||||
|
|
||||||
|
@ -16,6 +16,10 @@
|
|||||||
<event name='cmt' enabled='yes'/>
|
<event name='cmt' enabled='yes'/>
|
||||||
<event name='mbmt' enabled='no'/>
|
<event name='mbmt' enabled='no'/>
|
||||||
<event name='mbml' enabled='yes'/>
|
<event name='mbml' enabled='yes'/>
|
||||||
|
<event name='cpu_cycles' enabled='no'/>
|
||||||
|
<event name='instructions' enabled='yes'/>
|
||||||
|
<event name='cache_references' enabled='no'/>
|
||||||
|
<event name='cache_misses' enabled='no'/>
|
||||||
</perf>
|
</perf>
|
||||||
<devices>
|
<devices>
|
||||||
</devices>
|
</devices>
|
||||||
|
@ -934,6 +934,10 @@ I<--perf> returns the statistics of all enabled perf events:
|
|||||||
"perf.cmt" - the cache usage in Byte currently used
|
"perf.cmt" - the cache usage in Byte currently used
|
||||||
"perf.mbmt" - total system bandwidth from one level of cache
|
"perf.mbmt" - total system bandwidth from one level of cache
|
||||||
"perf.mbml" - bandwidth of memory traffic for a memory controller
|
"perf.mbml" - bandwidth of memory traffic for a memory controller
|
||||||
|
"perf.cpu_cycles" - the number of cpu cycles one instruction needs
|
||||||
|
"perf.instructions" - the count of instructions
|
||||||
|
"perf.cache_references" - the count of cache hits
|
||||||
|
"perf.cache_misses" - the count of caches misses
|
||||||
|
|
||||||
See the B<perf> command for more details about each event.
|
See the B<perf> command for more details about each event.
|
||||||
|
|
||||||
@ -2237,6 +2241,15 @@ B<Valid perf event names>
|
|||||||
mbml - Provides a way to limit the amount of data
|
mbml - Provides a way to limit the amount of data
|
||||||
(bytes/s) send through the memory controller
|
(bytes/s) send through the memory controller
|
||||||
on the socket.
|
on the socket.
|
||||||
|
cache_misses - Provides the count of cache misses by
|
||||||
|
applications running on the platform.
|
||||||
|
cache_references - Provides the count of cache hits by
|
||||||
|
applications running on th e platform.
|
||||||
|
instructions - Provides the count of instructions executed
|
||||||
|
by applications running on the platform.
|
||||||
|
cpu_cycles - Provides the number of cpu_cycles for one
|
||||||
|
instruction. May be used with instructions
|
||||||
|
in order to get a cycles per instruction.
|
||||||
|
|
||||||
B<Note>: The statistics can be retrieved using the B<domstats> command using
|
B<Note>: The statistics can be retrieved using the B<domstats> command using
|
||||||
the I<--perf> flag.
|
the I<--perf> flag.
|
||||||
|
Loading…
Reference in New Issue
Block a user