mirror of
https://git.lyx.org/repos/lyx.git
synced 2024-12-16 18:03:49 +00:00
bdf3924fc7
This is more portable, and on Windows the old code made it impossible to instrument several classes at the same time (several .obj files, actually). No new feature here, but the code is nicely slower. It might be less efficient, I am not really at ease with how std::chrono works.
227 lines
4.9 KiB
C++
227 lines
4.9 KiB
C++
// -*- C++ -*-
|
|
/* \file pmprof.h
|
|
* This file is part of LyX, the document processor.
|
|
* Licence details can be found in the file COPYING.
|
|
*
|
|
* \author Jean-Marc Lasgouttes
|
|
*
|
|
* Full author contact details are available in file CREDITS.
|
|
*/
|
|
|
|
/**
|
|
* ==== HOW TO USE THIS TRIVIAL PROFILER:
|
|
*
|
|
* * at the beginning of the interesting block, just add:
|
|
* PROFILE_THIS_BLOCK(some_identifier)
|
|
*
|
|
* A trailing semicolon can be added at your discretion.
|
|
*
|
|
* * when the program ends, statistics will be sent to standard error, like:
|
|
*
|
|
* #pmprof# some_identifier: 6.51 us, count=7120, total=46.33 ms
|
|
*
|
|
* * It is also possible to profile caching schemes. All it takes is an additional
|
|
* PROFILE_CACHE_MISS(some_identifier)
|
|
* in the place that takes care of cache misses. Then the output at the end will change to
|
|
*
|
|
* #pmprof# some_identifier: 6.51 us, count=7120, total=46.33 ms
|
|
* hit: 96%, 4.36 us, count=6849, total=29.89 ms
|
|
* miss: 3%, 60.65 us, count=271, total=16.43 ms
|
|
*
|
|
* * if DISABLE_PMPROF is defined before including pmprof.h, the
|
|
* profiler is replaced by empty macros. This is useful for quickly
|
|
* checking the overhead.
|
|
*
|
|
* ==== ABOUT PROFILING SCOPE:
|
|
*
|
|
* The code measured by the profiler corresponds to the lifetime of a
|
|
* local variable declared by the PROFILE_THIS_BLOCK macro.
|
|
*
|
|
* Some examples of profiling scope: In the snippets below, c1, c2...
|
|
* designate code chunks, and the identifiers of profiling blocks are
|
|
* chosen to reflect what they count.
|
|
*
|
|
* {
|
|
* c1
|
|
* PROFILE_THIS_BLOCK(c2)
|
|
* c2
|
|
* }
|
|
*
|
|
*
|
|
* {
|
|
* PROFILE_THIS_BLOCK(c1_c2)
|
|
* c1
|
|
* PROFILE_THIS_BLOCK(c2)
|
|
* c2
|
|
* }
|
|
*
|
|
*
|
|
* {
|
|
* {
|
|
* PROFILE_THIS_BLOCK(c1)
|
|
* c1
|
|
* }
|
|
* PROFILE_THIS_BLOCK(c2)
|
|
* c2
|
|
* }
|
|
*
|
|
*
|
|
* {
|
|
* PROFILE_THIS_BLOCK(c1_c2_c3)
|
|
* c1
|
|
* {
|
|
* PROFILE_THIS_BLOCK(c2)
|
|
* c2
|
|
* }
|
|
* c3
|
|
* }
|
|
*
|
|
* Influence of identifier names: they are mainly used for display
|
|
* purpose, but the same name should not be used twice in the same
|
|
* scope.
|
|
*
|
|
* {
|
|
* PROFILE_THIS_BLOCK(foo)
|
|
* c1
|
|
* PROFILE_THIS_BLOCK(foo) // error: identifier clash
|
|
* c2
|
|
* }
|
|
*
|
|
* In the example below, c1+c2 and c2 are counted separately, but in
|
|
* the output, both are confusingly labelled `foo'.
|
|
*
|
|
* {
|
|
* PROFILE_THIS_BLOCK(foo)
|
|
* c1
|
|
* {
|
|
* PROFILE_THIS_BLOCK(foo) // compiles (inner scope), but is also reported as `foo'
|
|
* c2
|
|
* }
|
|
* }
|
|
|
|
*/
|
|
|
|
#ifndef PMPROF_H
|
|
#define PMPROF_H
|
|
|
|
#if defined(DISABLE_PMPROF)
|
|
|
|
// DISABLE_PMPROF is set: both profiling macros expand to nothing, so
// instrumented code still compiles but no profiling code is emitted.
#define PROFILE_THIS_BLOCK(a)
#define PROFILE_CACHE_MISS(a)
|
|
|
|
#else
|
|
|
|
#include <chrono>
|
|
#include <iomanip>
|
|
#include <iostream>
|
|
|
|
|
|
//#if defined(__GNUG__) && defined(_GLIBCXX_DEBUG)
|
|
//#error Profiling is not usable when run-time debugging is in effect
|
|
//#endif
|
|
|
|
namespace {

/* Print a duration to std::cerr with two decimals: in seconds when it
 * is at least 1 s, in milliseconds when it is at least 1 ms, and in
 * microseconds otherwise.
 *
 * The format flags and precision of std::cerr are restored before
 * returning, so that later output on std::cerr is not affected.
 */
void dumpTime(std::chrono::duration<double> value)
{
	double const val = value.count();

	// std::fixed and std::setprecision are sticky: remember the
	// current settings so that they can be put back below.
	std::ios_base::fmtflags const old_flags = std::cerr.flags();
	std::streamsize const old_precision = std::cerr.precision();

	std::cerr << std::fixed << std::setprecision(2);
	if (val >= 1.0)
		std::cerr << val << " s";
	else if (val >= 0.001)
		std::cerr << val * 1000 << " ms";
	else
		std::cerr << val * 1000000 << " us";

	std::cerr.flags(old_flags);
	std::cerr.precision(old_precision);
}

/* Print one line of statistics to std::cerr: the average time per
 * call, the number of calls and the total time, followed by a newline.
 *
 * When count is 0 the average is reported as zero instead of the NaN
 * that dividing by zero would produce.
 */
void dump(std::chrono::duration<double> total, unsigned long long count) {
	std::chrono::duration<double> const average = count > 0
		? total / count
		: std::chrono::duration<double>::zero();
	dumpTime(average);
	std::cerr << ", count=" << count
	          << ", total=";
	dumpTime(total);
	std::cerr << std::endl;
}

} // namespace
|
|
|
|
|
|
/* Helper class for gathering data. Instantiate this as a static
|
|
* variable, so that its destructor will be executed when the program
|
|
* ends.
|
|
*/
|
|
|
|
|
|
class PMProfStat {
|
|
public:
|
|
PMProfStat(char const * name) : name_(name), count_(0), miss_count_(0) {}
|
|
|
|
~PMProfStat() {
|
|
if (count_>0) {
|
|
if (miss_count_ == 0) {
|
|
std::cerr << "#pmprof# " << name_ << ": ";
|
|
dump(dur_, count_);
|
|
}
|
|
else {
|
|
std::cerr << "#pmprof# " << name_ << ": ";
|
|
dump(dur_ + miss_dur_, count_ + miss_count_);
|
|
std::cerr << " hit: " << 100 * count_ / (count_ + miss_count_) << "%, ";
|
|
dump(dur_, count_);
|
|
std::cerr << " miss: " << 100 * miss_count_ / (count_ + miss_count_) << "%, ";
|
|
dump(miss_dur_, miss_count_);
|
|
}
|
|
}
|
|
}
|
|
|
|
void add(std::chrono::duration<double> d, const bool hit) {
|
|
if (hit) {
|
|
dur_ += d;
|
|
count_++;
|
|
} else {
|
|
miss_dur_ += d;
|
|
miss_count_++;
|
|
}
|
|
}
|
|
|
|
private:
|
|
char const * name_;
|
|
std::chrono::duration<double> dur_, miss_dur_;
|
|
unsigned long long count_, miss_count_;
|
|
};
|
|
|
|
|
|
/* Helper class which gathers data at the end of the scope. One
|
|
* instance of this one should be created at each execution of the
|
|
* block. At the end of the block, it sends statistics to the static
|
|
* PMProfStat object.
|
|
*/
|
|
class PMProfInstance {
|
|
public:
|
|
PMProfInstance(PMProfStat * stat) : hit(true), stat_(stat)
|
|
{
|
|
before_ = std::chrono::system_clock::now();
|
|
}
|
|
|
|
~PMProfInstance() {
|
|
stat_->add(std::chrono::system_clock::now() - before_, hit);
|
|
}
|
|
|
|
bool hit;
|
|
|
|
private:
|
|
std::chrono::system_clock::time_point before_;
|
|
PMProfStat * stat_;
|
|
};
|
|
|
|
|
|
/* Profile the rest of the enclosing block under the label `a'.
 * Declares a static PMProfStat named PMPS_a, which accumulates the
 * measurements, and a local PMProfInstance named PMPI_a, which reports
 * to it when it is destroyed. The expansion already ends with a
 * semicolon, so a trailing one after the macro is optional.
 */
#define PROFILE_THIS_BLOCK(a) \
	static PMProfStat PMPS_##a(#a); \
	PMProfInstance PMPI_##a(&PMPS_##a);
|
|
|
|
/* Count the current execution of profiled block `a' as a cache miss,
 * by clearing the `hit' member of PMPI_a. It must appear where the
 * PMPI_a variable declared by PROFILE_THIS_BLOCK(a) is in scope.
 */
#define PROFILE_CACHE_MISS(a) \
	PMPI_##a.hit = false;
|
|
|
|
#endif // !defined(DISABLE_PMPROF)
|
|
|
|
#endif
|