summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Xianyi Zhang <xianyi@iscas.ac.cn> 2011-06-09 10:40:15 +0800
committer: Xianyi Zhang <xianyi@iscas.ac.cn> 2011-06-09 10:40:15 +0800
commit: 149638322434c90ba7fafb48312a08d1634144dd (patch)
tree: 71ead2924bc6fd3fcce7fcaa9d3808d5db7f3080
parent: 4335bca2f7265193186771c5b1cc4f6b177c85b8 (diff)
download: openblas-149638322434c90ba7fafb48312a08d1634144dd.tar.gz
openblas-149638322434c90ba7fafb48312a08d1634144dd.tar.bz2
openblas-149638322434c90ba7fafb48312a08d1634144dd.zip
Print the wall time (in cycles) when FUNCTION_PROFILE is enabled.
-rw-r--r-- Changelog.txt 1
-rw-r--r-- driver/others/profile.c 9
-rwxr-xr-x [-rw-r--r--] interface/create 0
3 files changed, 6 insertions, 4 deletions
diff --git a/Changelog.txt b/Changelog.txt
index c4e6a8fe2..cc90ee198 100644
--- a/Changelog.txt
+++ b/Changelog.txt
@@ -18,6 +18,7 @@ common:
* Added openblas_set_num_threads for Fortran.
* Fixed #25 a wrong result of rotmg.
* Fixed a bug about detecting underscore prefix in c_check.
+ * Print the wall time (cycles) with enabling FUNCTION_PROFILE
x86/x86_64:
* Fixed #28 a wrong result of dsdot on x86_64.
diff --git a/driver/others/profile.c b/driver/others/profile.c
index f65550c9f..f464c0b6a 100644
--- a/driver/others/profile.c
+++ b/driver/others/profile.c
@@ -74,20 +74,21 @@ void gotoblas_profile_quit(void) {
if (cycles > 0) {
fprintf(stderr, "\n\t====== BLAS Profiling Result =======\n\n");
- fprintf(stderr, " Function No. of Calls Time Consumption Efficiency Bytes/cycle\n");
+ fprintf(stderr, " Function No. of Calls Time Consumption Efficiency Bytes/cycle Wall Time(Cycles)\n");
for (i = 0; i < MAX_PROF_TABLE; i ++) {
if (function_profile_table[i].calls) {
#ifndef OS_WINDOWS
- fprintf(stderr, "%-12s : %10Ld %8.2f%% %10.3f%% %8.2f\n",
+ fprintf(stderr, "%-12s : %10Ld %8.2f%% %10.3f%% %8.2f %Ld\n",
#else
- fprintf(stderr, "%-12s : %10lld %8.2f%% %10.3f%% %8.2f\n",
+ fprintf(stderr, "%-12s : %10lld %8.2f%% %10.3f%% %8.2f %lld\n",
#endif
func_table[i],
function_profile_table[i].calls,
(double)function_profile_table[i].cycles / (double)cycles * 100.,
(double)function_profile_table[i].fops / (double)function_profile_table[i].tcycles * 100.,
- (double)function_profile_table[i].area / (double)function_profile_table[i].cycles
+ (double)function_profile_table[i].area / (double)function_profile_table[i].cycles,
+ function_profile_table[i].cycles
);
}
}
diff --git a/interface/create b/interface/create
index b7be8ab6e..b7be8ab6e 100644..100755
--- a/interface/create
+++ b/interface/create