mirror of
https://github.com/KhronosGroup/SPIRV-Tools
synced 2025-01-03 21:51:05 +00:00
388 lines
14 KiB
C
388 lines
14 KiB
C
|
// Copyright (c) 2018 Google LLC.
|
||
|
//
|
||
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
// you may not use this file except in compliance with the License.
|
||
|
// You may obtain a copy of the License at
|
||
|
//
|
||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||
|
//
|
||
|
// Unless required by applicable law or agreed to in writing, software
|
||
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
// See the License for the specific language governing permissions and
|
||
|
// limitations under the License.
|
||
|
|
||
|
// Contains utils for getting resource utilization
|
||
|
|
||
|
#ifndef LIBSPIRV_UTIL_TIMER_H_
|
||
|
#define LIBSPIRV_UTIL_TIMER_H_
|
||
|
|
||
|
#if defined(SPIRV_TIMER_ENABLED)
|
||
|
|
||
|
#include <sys/resource.h>
|
||
|
#include <cassert>
|
||
|
#include <iostream>
|
||
|
|
||
|
// A macro to call spvutils::PrintTimerDescription(std::ostream*, bool). The
|
||
|
// first argument must be given as std::ostream*. If it is NULL, the function
|
||
|
// does nothing. Otherwise, it prints resource types measured by Timer class.
|
||
|
// The second is optional and if it is true, the function also prints resource
|
||
|
// type fields related to memory. Otherwise, it does not print memory related
|
||
|
// fields. Its default is false. In usual, this must be placed before calling
|
||
|
// Timer::Report() to inform what those fields printed by Timer::Report()
|
||
|
// indicate (or spvutils::PrintTimerDescription() must be used instead).
|
||
|
#define SPIRV_TIMER_DESCRIPTION(...) \
|
||
|
spvutils::PrintTimerDescription(__VA_ARGS__)
|
||
|
|
||
|
// Creates an object of ScopedTimer to measure the resource utilization for the
|
||
|
// scope surrounding it as the following example:
|
||
|
//
|
||
|
// { // <-- beginning of this scope
|
||
|
//
|
||
|
// /* ... code out of interest ... */
|
||
|
//
|
||
|
// SPIRV_TIMER_SCOPED(std::cout, tag);
|
||
|
//
|
||
|
// /* ... lines of code that we want to know its resource usage ... */
|
||
|
//
|
||
|
// } // <-- end of this scope. The destructor of ScopedTimer prints tag and
|
||
|
// the resource utilization to std::cout.
|
||
|
#define SPIRV_TIMER_SCOPED(...) \
|
||
|
spvutils::ScopedTimer<spvutils::Timer> timer##__LINE__(__VA_ARGS__)
|
||
|
|
||
|
namespace spvutils {
|
||
|
|
||
|
// Prints the description of resource types measured by Timer class. If |out| is
|
||
|
// NULL, it does nothing. Otherwise, it prints resource types. The second is
|
||
|
// optional and if it is true, the function also prints resource type fields
|
||
|
// related to memory. Its default is false. In usual, this must be placed before
|
||
|
// calling Timer::Report() to inform what those fields printed by
|
||
|
// Timer::Report() indicate.
|
||
|
void PrintTimerDescription(std::ostream*, bool = false);
|
||
|
|
||
|
// Status of Timer. kGetrusageFailed means it failed in calling getrusage().
|
||
|
// kClockGettimeWalltimeFailed means it failed in getting wall time when calling
|
||
|
// clock_gettime(). kClockGettimeCPUtimeFailed means it failed in getting CPU
|
||
|
// time when calling clock_gettime().
|
||
|
enum UsageStatus {
|
||
|
kSucceeded = 0,
|
||
|
kGetrusageFailed = 1 << 0,
|
||
|
kClockGettimeWalltimeFailed = 1 << 1,
|
||
|
kClockGettimeCPUtimeFailed = 1 << 2,
|
||
|
};
|
||
|
|
||
|
// Timer measures the resource utilization for a range of code. The resource
|
||
|
// utilization consists of CPU time (i.e., process time), WALL time (elapsed
|
||
|
// time), USR time, SYS time, RSS delta, and the delta of the number of page
|
||
|
// faults. RSS delta and the delta of the number of page faults are measured
|
||
|
// only when |measure_mem_usage| given to the constructor is true. This class
|
||
|
// should be used as the following example:
|
||
|
//
|
||
|
// spvutils::Timer timer(std::cout);
|
||
|
// timer.Start(); // <-- set |usage_before_|, |wall_before_|,
|
||
|
// and |cpu_before_|
|
||
|
//
|
||
|
// /* ... lines of code that we want to know its resource usage ... */
|
||
|
//
|
||
|
// timer.Stop(); // <-- set |cpu_after_|, |wall_after_|, and
|
||
|
// |usage_after_|
|
||
|
// timer.Report(tag); // <-- print tag and the resource utilization to
|
||
|
// std::cout.
|
||
|
class Timer {
|
||
|
public:
|
||
|
Timer(std::ostream* out, bool measure_mem_usage = false)
|
||
|
: report_stream_(out),
|
||
|
usage_status_(kSucceeded),
|
||
|
measure_mem_usage_(measure_mem_usage) {}
|
||
|
|
||
|
// Sets |usage_before_|, |wall_before_|, and |cpu_before_| as results of
|
||
|
// getrusage(), clock_gettime() for the wall time, and clock_gettime() for the
|
||
|
// CPU time respectively. Note that this method erases all previous state of
|
||
|
// |usage_before_|, |wall_before_|, |cpu_before_|.
|
||
|
virtual void Start();
|
||
|
|
||
|
// Sets |cpu_after_|, |wall_after_|, and |usage_after_| as results of
|
||
|
// clock_gettime() for the wall time, and clock_gettime() for the CPU time,
|
||
|
// getrusage() respectively. Note that this method erases all previous state
|
||
|
// of |cpu_after_|, |wall_after_|, |usage_after_|.
|
||
|
virtual void Stop();
|
||
|
|
||
|
// If |report_stream_| is NULL, it does nothing. Otherwise, it prints the
|
||
|
// resource utilization (i.e., CPU/WALL/USR/SYS time, RSS delta) between the
|
||
|
// time of calling Timer::Start() and the time of calling Timer::Stop(). If we
|
||
|
// cannot get a resource usage because of failures, it prints "Failed" instead
|
||
|
// for the resource.
|
||
|
void Report(const char* tag);
|
||
|
|
||
|
// Returns the measured CPU Time (i.e., process time) for a range of code
|
||
|
// execution. If kClockGettimeCPUtimeFailed is set by the failure of calling
|
||
|
// clock_gettime(), it returns -1.
|
||
|
virtual double CPUTime() {
|
||
|
if (usage_status_ & kClockGettimeCPUtimeFailed) return -1;
|
||
|
return TimeDifference(cpu_before_, cpu_after_);
|
||
|
}
|
||
|
|
||
|
// Returns the measured Wall Time (i.e., elapsed time) for a range of code
|
||
|
// execution. If kClockGettimeWalltimeFailed is set by the failure of
|
||
|
// calling clock_gettime(), it returns -1.
|
||
|
virtual double WallTime() {
|
||
|
if (usage_status_ & kClockGettimeWalltimeFailed) return -1;
|
||
|
return TimeDifference(wall_before_, wall_after_);
|
||
|
}
|
||
|
|
||
|
// Returns the measured USR Time for a range of code execution. If
|
||
|
// kGetrusageFailed is set because of the failure of calling getrusage(), it
|
||
|
// returns -1.
|
||
|
virtual double UserTime() {
|
||
|
if (usage_status_ & kGetrusageFailed) return -1;
|
||
|
return TimeDifference(usage_before_.ru_utime, usage_after_.ru_utime);
|
||
|
}
|
||
|
|
||
|
// Returns the measured SYS Time for a range of code execution. If
|
||
|
// kGetrusageFailed is set because of the failure of calling getrusage(), it
|
||
|
// returns -1.
|
||
|
virtual double SystemTime() {
|
||
|
if (usage_status_ & kGetrusageFailed) return -1;
|
||
|
return TimeDifference(usage_before_.ru_stime, usage_after_.ru_stime);
|
||
|
}
|
||
|
|
||
|
// Returns the measured RSS delta for a range of code execution. If
|
||
|
// kGetrusageFailed is set because of the failure of calling getrusage(), it
|
||
|
// returns -1.
|
||
|
virtual long RSS() const {
|
||
|
if (usage_status_ & kGetrusageFailed) return -1;
|
||
|
return usage_after_.ru_maxrss - usage_before_.ru_maxrss;
|
||
|
}
|
||
|
|
||
|
// Returns the measured the delta of the number of page faults for a range of
|
||
|
// code execution. If kGetrusageFailed is set because of the failure of
|
||
|
// calling getrusage(), it returns -1.
|
||
|
virtual long PageFault() const {
|
||
|
if (usage_status_ & kGetrusageFailed) return -1;
|
||
|
return (usage_after_.ru_minflt - usage_before_.ru_minflt) +
|
||
|
(usage_after_.ru_majflt - usage_before_.ru_majflt);
|
||
|
}
|
||
|
|
||
|
virtual ~Timer() {}
|
||
|
|
||
|
private:
|
||
|
// Returns the time gap between |from| and |to| in seconds.
|
||
|
static double TimeDifference(const timeval& from, const timeval& to) {
|
||
|
assert((to.tv_sec > from.tv_sec) ||
|
||
|
(to.tv_sec == from.tv_sec && to.tv_usec >= from.tv_usec));
|
||
|
return static_cast<double>(to.tv_sec - from.tv_sec) +
|
||
|
static_cast<double>(to.tv_usec - from.tv_usec) * .000001;
|
||
|
}
|
||
|
|
||
|
// Returns the time gap between |from| and |to| in seconds.
|
||
|
static double TimeDifference(const timespec& from, const timespec& to) {
|
||
|
assert((to.tv_sec > from.tv_sec) ||
|
||
|
(to.tv_sec == from.tv_sec && to.tv_nsec >= from.tv_nsec));
|
||
|
return static_cast<double>(to.tv_sec - from.tv_sec) +
|
||
|
static_cast<double>(to.tv_nsec - from.tv_nsec) * .000000001;
|
||
|
}
|
||
|
|
||
|
// Output stream to print out the resource utilization. If it is NULL,
|
||
|
// Report() does nothing.
|
||
|
std::ostream* report_stream_;
|
||
|
|
||
|
// Status to stop measurement if a system call returns an error.
|
||
|
unsigned usage_status_;
|
||
|
|
||
|
// Variable to save the result of clock_gettime(CLOCK_PROCESS_CPUTIME_ID) when
|
||
|
// Timer::Start() is called. It is used as the base status of CPU time.
|
||
|
timespec cpu_before_;
|
||
|
|
||
|
// Variable to save the result of clock_gettime(CLOCK_MONOTONIC) when
|
||
|
// Timer::Start() is called. It is used as the base status of WALL time.
|
||
|
timespec wall_before_;
|
||
|
|
||
|
// Variable to save the result of getrusage() when Timer::Start() is called.
|
||
|
// It is used as the base status of USR time, SYS time, and RSS.
|
||
|
rusage usage_before_;
|
||
|
|
||
|
// Variable to save the result of clock_gettime(CLOCK_PROCESS_CPUTIME_ID) when
|
||
|
// Timer::Stop() is called. It is used as the last status of CPU time. The
|
||
|
// resouce usage is measured by subtracting |cpu_before_| from it.
|
||
|
timespec cpu_after_;
|
||
|
|
||
|
// Variable to save the result of clock_gettime(CLOCK_MONOTONIC) when
|
||
|
// Timer::Stop() is called. It is used as the last status of WALL time. The
|
||
|
// resouce usage is measured by subtracting |wall_before_| from it.
|
||
|
timespec wall_after_;
|
||
|
|
||
|
// Variable to save the result of getrusage() when Timer::Stop() is called. It
|
||
|
// is used as the last status of USR time, SYS time, and RSS. Those resouce
|
||
|
// usages are measured by subtracting |usage_before_| from it.
|
||
|
rusage usage_after_;
|
||
|
|
||
|
// If true, Timer reports the memory usage information too. Otherwise, Timer
|
||
|
// reports only USR time, WALL time, SYS time.
|
||
|
bool measure_mem_usage_;
|
||
|
};
|
||
|
|
||
|
// The purpose of ScopedTimer is to measure the resource utilization for a
|
||
|
// scope. Simply creating a local variable of ScopedTimer will call
|
||
|
// Timer::Start() and it calls Timer::Stop() and Timer::Report() at the end of
|
||
|
// the scope by its destructor. When we use this class, we must choose the
|
||
|
// proper Timer class (for class TimerType template) in advance. This class
|
||
|
// should be used as the following example:
|
||
|
//
|
||
|
// { // <-- beginning of this scope
|
||
|
//
|
||
|
// /* ... code out of interest ... */
|
||
|
//
|
||
|
// spvutils::ScopedTimer<spvutils::Timer> scopedtimer(std::cout, tag);
|
||
|
//
|
||
|
// /* ... lines of code that we want to know its resource usage ... */
|
||
|
//
|
||
|
// } // <-- end of this scope. The destructor of ScopedTimer prints tag and
|
||
|
// the resource utilization to std::cout.
|
||
|
//
|
||
|
// The template<class TimerType> is used to choose a Timer class. Currently,
|
||
|
// only options for the Timer class are Timer and MockTimer in the unit test.
|
||
|
template <class TimerType>
|
||
|
class ScopedTimer {
|
||
|
public:
|
||
|
ScopedTimer(std::ostream* out, const char* tag,
|
||
|
bool measure_mem_usage = false)
|
||
|
: timer(new TimerType(out, measure_mem_usage)), tag_(tag) {
|
||
|
timer->Start();
|
||
|
}
|
||
|
|
||
|
// At the end of the scope surrounding the instance of this class, this
|
||
|
// destructor saves the last status of resource usage and reports it.
|
||
|
virtual ~ScopedTimer() {
|
||
|
timer->Stop();
|
||
|
timer->Report(tag_);
|
||
|
delete timer;
|
||
|
}
|
||
|
|
||
|
private:
|
||
|
// Actual timer that measures the resource utilization. It must be an instance
|
||
|
// of Timer class if there is no special reason to use other class.
|
||
|
TimerType* timer;
|
||
|
|
||
|
// A tag that will be printed in front of the trace reported by Timer class.
|
||
|
const char* tag_;
|
||
|
};
|
||
|
|
||
|
// CumulativeTimer is the same as Timer class, but it supports a cumulative
|
||
|
// measurement as the following example:
|
||
|
//
|
||
|
// CumulativeTimer *ctimer = new CumulativeTimer(std::cout);
|
||
|
// ctimer->Start();
|
||
|
//
|
||
|
// /* ... lines of code that we want to know its resource usage ... */
|
||
|
//
|
||
|
// ctimer->Stop();
|
||
|
//
|
||
|
// /* ... code out of interest ... */
|
||
|
//
|
||
|
// ctimer->Start();
|
||
|
//
|
||
|
// /* ... lines of code that we want to know its resource usage ... */
|
||
|
//
|
||
|
// ctimer->Stop();
|
||
|
// ctimer->Report(tag);
|
||
|
// delete ctimer;
|
||
|
//
|
||
|
class CumulativeTimer : public Timer {
|
||
|
public:
|
||
|
CumulativeTimer(std::ostream* out, bool measure_mem_usage = false)
|
||
|
: Timer(out, measure_mem_usage),
|
||
|
cpu_time_(0),
|
||
|
wall_time_(0),
|
||
|
usr_time_(0),
|
||
|
sys_time_(0),
|
||
|
rss_(0),
|
||
|
pgfaults_(0) {}
|
||
|
|
||
|
// If we cannot get a resource usage because of failures, it sets -1 for the
|
||
|
// resource usage.
|
||
|
void Stop() override {
|
||
|
Timer::Stop();
|
||
|
|
||
|
if (cpu_time_ >= 0 && Timer::CPUTime() >= 0)
|
||
|
cpu_time_ += Timer::CPUTime();
|
||
|
else
|
||
|
cpu_time_ = -1;
|
||
|
|
||
|
if (wall_time_ >= 0 && Timer::WallTime() >= 0)
|
||
|
wall_time_ += Timer::WallTime();
|
||
|
else
|
||
|
wall_time_ = -1;
|
||
|
|
||
|
if (usr_time_ >= 0 && Timer::UserTime() >= 0)
|
||
|
usr_time_ += Timer::UserTime();
|
||
|
else
|
||
|
usr_time_ = -1;
|
||
|
|
||
|
if (sys_time_ >= 0 && Timer::SystemTime() >= 0)
|
||
|
sys_time_ += Timer::SystemTime();
|
||
|
else
|
||
|
sys_time_ = -1;
|
||
|
|
||
|
if (rss_ >= 0 && Timer::RSS() >= 0)
|
||
|
rss_ += Timer::RSS();
|
||
|
else
|
||
|
rss_ = -1;
|
||
|
|
||
|
if (pgfaults_ >= 0 && Timer::PageFault() >= 0)
|
||
|
pgfaults_ += Timer::PageFault();
|
||
|
else
|
||
|
pgfaults_ = -1;
|
||
|
}
|
||
|
|
||
|
// Returns the cumulative CPU Time (i.e., process time) for a range of code
|
||
|
// execution.
|
||
|
double CPUTime() override { return cpu_time_; }
|
||
|
|
||
|
// Returns the cumulative Wall Time (i.e., elapsed time) for a range of code
|
||
|
// execution.
|
||
|
double WallTime() override { return wall_time_; }
|
||
|
|
||
|
// Returns the cumulative USR Time for a range of code execution.
|
||
|
double UserTime() override { return usr_time_; }
|
||
|
|
||
|
// Returns the cumulative SYS Time for a range of code execution.
|
||
|
double SystemTime() override { return sys_time_; }
|
||
|
|
||
|
// Returns the cumulative RSS delta for a range of code execution.
|
||
|
long RSS() const override { return rss_; }
|
||
|
|
||
|
// Returns the cumulative delta of number of page faults for a range of code
|
||
|
// execution.
|
||
|
long PageFault() const override { return pgfaults_; }
|
||
|
|
||
|
private:
|
||
|
// Variable to save the cumulative CPU time (i.e., process time).
|
||
|
double cpu_time_;
|
||
|
|
||
|
// Variable to save the cumulative wall time (i.e., elapsed time).
|
||
|
double wall_time_;
|
||
|
|
||
|
// Variable to save the cumulative user time.
|
||
|
double usr_time_;
|
||
|
|
||
|
// Variable to save the cumulative system time.
|
||
|
double sys_time_;
|
||
|
|
||
|
// Variable to save the cumulative RSS delta.
|
||
|
long rss_;
|
||
|
|
||
|
// Variable to save the cumulative delta of the number of page faults.
|
||
|
long pgfaults_;
|
||
|
};
|
||
|
|
||
|
} // namespace spvutils
|
||
|
|
||
|
#else // defined(SPIRV_TIMER_ENABLED)
|
||
|
|
||
|
#define SPIRV_TIMER_DESCRIPTION(...)
|
||
|
#define SPIRV_TIMER_SCOPED(...)
|
||
|
|
||
|
#endif // defined(SPIRV_TIMER_ENABLED)
|
||
|
|
||
|
#endif // LIBSPIRV_UTIL_TIMER_H_
|