blob: bdfe68c3fc9c6bfc7c1c9c7d95842d10d1e30578 [file] [log] [blame]
/** @file kmp_stats_timing.cpp
 * Timing functions
 */

//===----------------------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
12
Jim Cownie4cc4bb42014-10-07 16:25:50 +000013#include <stdlib.h>
14#include <unistd.h>
15
Jim Cownie4cc4bb42014-10-07 16:25:50 +000016#include <iomanip>
Jonathan Peyton30419822017-05-12 18:01:32 +000017#include <iostream>
Jim Cownie4cc4bb42014-10-07 16:25:50 +000018#include <sstream>
19
Jonathan Peytonf7413122015-12-17 16:58:26 +000020#include "kmp.h"
Jim Cownie4cc4bb42014-10-07 16:25:50 +000021#include "kmp_stats_timing.h"
22
23using namespace std;
24
Jonathan Peyton8b524592015-12-17 17:27:51 +000025#if KMP_HAVE_TICK_TIME
Jonathan Peyton30419822017-05-12 18:01:32 +000026#if KMP_MIC
27double tsc_tick_count::tick_time() {
28 // pretty bad assumption of 1GHz clock for MIC
29 return 1 / ((double)1000 * 1.e6);
Jim Cownie4cc4bb42014-10-07 16:25:50 +000030}
Jonathan Peyton30419822017-05-12 18:01:32 +000031#elif KMP_ARCH_X86 || KMP_ARCH_X86_64
32#include <string.h>
Jim Cownie4cc4bb42014-10-07 16:25:50 +000033// Extract the value from the CPUID information
Jonathan Peyton30419822017-05-12 18:01:32 +000034double tsc_tick_count::tick_time() {
35 static double result = 0.0;
Jim Cownie4cc4bb42014-10-07 16:25:50 +000036
Jonathan Peyton30419822017-05-12 18:01:32 +000037 if (result == 0.0) {
38 kmp_cpuid_t cpuinfo;
39 char brand[256];
Jim Cownie4cc4bb42014-10-07 16:25:50 +000040
Jonathan Peyton30419822017-05-12 18:01:32 +000041 __kmp_x86_cpuid(0x80000000, 0, &cpuinfo);
42 memset(brand, 0, sizeof(brand));
43 int ids = cpuinfo.eax;
Jim Cownie4cc4bb42014-10-07 16:25:50 +000044
Jonathan Peyton30419822017-05-12 18:01:32 +000045 for (unsigned int i = 2; i < (ids ^ 0x80000000) + 2; i++)
46 __kmp_x86_cpuid(i | 0x80000000, 0,
47 (kmp_cpuid_t *)(brand + (i - 2) * sizeof(kmp_cpuid_t)));
Jim Cownie4cc4bb42014-10-07 16:25:50 +000048
Jonathan Peyton30419822017-05-12 18:01:32 +000049 char *start = &brand[0];
50 for (; *start == ' '; start++)
51 ;
Jonathan Peyton072772b2016-04-05 18:48:48 +000052
Jonathan Peyton30419822017-05-12 18:01:32 +000053 char *end = brand + KMP_STRLEN(brand) - 3;
54 uint64_t multiplier;
Jim Cownie4cc4bb42014-10-07 16:25:50 +000055
Jonathan Peyton30419822017-05-12 18:01:32 +000056 if (*end == 'M')
57 multiplier = 1000LL * 1000LL;
58 else if (*end == 'G')
59 multiplier = 1000LL * 1000LL * 1000LL;
60 else if (*end == 'T')
61 multiplier = 1000LL * 1000LL * 1000LL * 1000LL;
62 else {
63 cout << "Error determining multiplier '" << *end << "'\n";
64 exit(-1);
Jim Cownie4cc4bb42014-10-07 16:25:50 +000065 }
Jonathan Peyton30419822017-05-12 18:01:32 +000066 *end = 0;
67 while (*end != ' ')
68 end--;
69 end++;
70
71 double freq = strtod(end, &start);
72 if (freq == 0.0) {
73 cout << "Error calculating frequency " << end << "\n";
74 exit(-1);
75 }
76
77 result = ((double)1.0) / (freq * multiplier);
78 }
79 return result;
Jim Cownie4cc4bb42014-10-07 16:25:50 +000080}
Jonathan Peyton30419822017-05-12 18:01:32 +000081#endif
Jim Cownie4cc4bb42014-10-07 16:25:50 +000082#endif
83
// When true, formatSI() rescales the value and attaches an SI prefix to the
// unit; when false the value is printed unscaled.
static bool useSI = true;

// Return a formatted string after normalising the value into
// engineering style and using a suitable unit prefix (e.g. ms, us, ns).
//
//   interval  value to format, expressed in the base unit
//   width     total field width; the number is right-aligned in width - 3
//             columns and the remaining 3 hold the prefix and the unit
//   unit      single character unit symbol appended after the prefix
//
// The number is always printed with two digits after the decimal point.
// Values whose magnitude is too large for the prefix table (or that are not
// finite) are printed unscaled, with their sign, and without a prefix.
std::string formatSI(double interval, int width, char unit) {
  std::stringstream os;

  if (useSI) {
    // Preserve accuracy for small numbers, since we only multiply and the
    // positive powers of ten are precisely representable.
    // An entry matches when |interval| * scale < 1; the value is then shown
    // as |interval| * 1000 * scale with the given prefix.
    static const struct {
      double scale;
      char prefix;
    } ranges[] = {{1.e21, 'y'},  {1.e18, 'z'},  {1.e15, 'a'},  {1.e12, 'f'},
                  {1.e9, 'p'},   {1.e6, 'n'},   {1.e3, 'u'},   {1.0, 'm'},
                  {1.e-3, ' '},  {1.e-6, 'k'},  {1.e-9, 'M'},  {1.e-12, 'G'},
                  {1.e-15, 'T'}, {1.e-18, 'P'}, {1.e-21, 'E'}, {1.e-24, 'Z'},
                  {1.e-27, 'Y'}};

    if (interval == 0.0) {
      os << std::setw(width - 3) << std::right << "0.00" << std::setw(3)
         << unit;
      return os.str();
    }

    // Work on the magnitude but leave 'interval' itself untouched, so that
    // the unscaled fallback below still prints the original sign.
    const bool negative = interval < 0.0;
    const double magnitude = negative ? -interval : interval;

    for (int i = 0; i < (int)(sizeof(ranges) / sizeof(ranges[0])); i++) {
      if (magnitude * ranges[i].scale < 1.e0) {
        const double scaled = magnitude * 1000.e0 * ranges[i].scale;
        os << std::fixed << std::setprecision(2) << std::setw(width - 3)
           << std::right << (negative ? -scaled : scaled) << std::setw(2)
           << ranges[i].prefix << std::setw(1) << unit;

        return os.str();
      }
    }
  }
  // Either SI scaling is disabled or no table entry matched.
  os << std::setprecision(2) << std::fixed << std::right << std::setw(width - 3)
     << interval << std::setw(3) << unit;

  return os.str();
}