Skip to content
GitLab
Projects
Groups
Snippets
/
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
Priyal Suneja
single-server-etrace
Commits
3220e838
Commit
3220e838
authored
Feb 25, 2022
by
Priyal Suneja
Browse files
added perf script
parent
d2a98685
Changes
99
Hide whitespace changes
Inline
Side-by-side
benchmarks/tests/msr/Makefile
View file @
3220e838
...
...
@@ -15,7 +15,7 @@ l1_populate: l1_populate.c utils.c msr.c
gcc
-O0
-Wall
-o
$(BUILDDIR)
/l1_populate l1_populate.c utils.c msr.c
-lm
l2_msr
:
l2_msr.c utils.c msr.c
gcc
-O0
-Wall
-o
$(BUILDDIR)
/l2_msr l2_msr.c utils.c msr.c
-lm
gcc
-O0
-g
-Wall
-o
$(BUILDDIR)
/l2_msr l2_msr.c utils.c msr.c
-lm
l2
:
l2.c utils.c msr.c
gcc
-O0
-Wall
-o
$(BUILDDIR)
/l2 l2.c utils.c msr.c
-lm
...
...
@@ -29,6 +29,9 @@ ins_msr: ins_msr.c msr.c utils.c
qs_msr
:
qs_msr.c msr.c utils.c
gcc
-O0
-Wall
-o
$(BUILDDIR)
/qs_msr qs_msr.c utils.c msr.c
-lm
mm_msr
:
mm_msr.c msr.c utils.c
gcc
-O0
-g
-Wall
-o
$(BUILDDIR)
/mm_msr mm_msr.c utils.c msr.c
-lm
ins
:
ins.c msr.c utils.c
gcc
-O0
-Wall
-o
$(BUILDDIR)
/ins ins.c msr.c utils.c
-lm
...
...
benchmarks/tests/msr/build/l1_msr
View file @
3220e838
No preview for this file type
benchmarks/tests/msr/build/l2_msr
View file @
3220e838
No preview for this file type
benchmarks/tests/msr/build/qs_msr
0 → 100755
View file @
3220e838
File added
benchmarks/tests/msr/l1_msr.c
View file @
3220e838
...
...
@@ -13,10 +13,16 @@ int measure_msr(int cpu_model, int cpu_info[3], double energy_units[2],
long
long
result
;
double
package_before
,
package_after
;
double
dram_before
,
dram_after
;
struct
ll
*
head
=
malloc
(
sizeof
(
struct
ll
));
struct
ll
*
curr
=
head
;
int
retval
=
populate_list
(
head
,
L1_LL_SIZE
);
// struct ll *head = malloc(sizeof(struct ll));
// struct ll *curr = head;
//
// int retval = populate_list(head, L1_LL_SIZE);
int
retval
;
int
arr
[
L1_LL_SIZE
];
for
(
int
i
=
0
;
i
<
L1_LL_SIZE
;
i
++
)
{
arr
[
i
]
=
L1_LL_SIZE
-
i
;
}
fd
=
open_msr
(
0
);
// todo: add package detection + map and stuff
...
...
@@ -36,10 +42,16 @@ int measure_msr(int cpu_model, int cpu_info[3], double energy_units[2],
close
(
fd
);
for
(
int
i
=
0
;
i
<
ITERATIONS_PER_RUN
;
i
++
)
{
while
(
curr
!=
NULL
)
{
curr
=
curr
->
next
;
int
index
=
0
;
while
(
index
<
L1_SIZE
)
{
int
j
=
index
;
for
(
j
;
j
<
L1_LL_SIZE
;
)
{
retval
+=
arr
[
j
];
j
+=
L1_SIZE
;
}
index
++
;
}
curr
=
head
;
}
fd
=
open_msr
(
0
);
...
...
benchmarks/tests/msr/l2_msr.c
View file @
3220e838
...
...
@@ -5,17 +5,19 @@
*/
#include
"msr.h"
int
measure_msr
(
int
cpu_model
,
int
cpu_info
[
3
],
double
energy_units
[
2
],
double
*
r1
,
double
*
r2
)
{
int
measure_msr
(
int
cpu_model
,
int
cpu_info
[
3
],
double
energy_units
[
2
],
double
*
r1
,
double
*
r2
)
{
int
dram_avail
=
2
;
int
fd
;
long
long
result
;
double
package_before
,
package_after
;
double
dram_before
,
dram_after
;
struct
ll
*
head
=
malloc
(
sizeof
(
struct
ll
));
struct
ll
*
curr
=
head
;
int
retval
=
0
;
int
retval
=
populate_list
(
head
,
L2_LL_SIZE
);
int
*
arr
=
malloc
(
L2_LL_SIZE
*
sizeof
(
int
));
for
(
int
i
=
0
;
i
<
L2_LL_SIZE
;
i
++
)
{
arr
[
i
]
=
L2_LL_SIZE
-
i
;
}
fd
=
open_msr
(
0
);
// todo: add package detection + map and stuff
...
...
@@ -35,10 +37,16 @@ int measure_msr(int cpu_model, int cpu_info[3], double energy_units[2],
close
(
fd
);
for
(
int
i
=
0
;
i
<
ITERATIONS_PER_RUN
;
i
++
)
{
while
(
curr
!=
NULL
)
{
curr
=
curr
->
next
;
int
index
=
0
;
while
(
index
<
L2_SIZE
)
{
int
j
=
index
;
for
(
j
;
j
<
L2_LL_SIZE
;)
{
retval
+=
arr
[
j
];
j
+=
L2_SIZE
;
}
index
++
;
}
curr
=
head
;
}
fd
=
open_msr
(
0
);
...
...
benchmarks/tests/msr/mm_msr.c
0 → 100644
View file @
3220e838
/*
* author: Priyal Suneja ; suneja@cs.washington.edu
*
* to run: sudo ./build/mm_msr
*/
#include
"msr.h"
/*
 * Multiplies two square MM_SIZE x MM_SIZE integer matrices.
 *
 * one, two - input matrices.
 * result   - output matrix; it is cleared in a first pass and the products
 *            are accumulated into it in a second pass.
 */
void matrix_multiply(int one[MM_SIZE][MM_SIZE], int two[MM_SIZE][MM_SIZE],
                     int result[MM_SIZE][MM_SIZE]) {
  const int n_rows = MM_SIZE;
  const int n_cols = MM_SIZE;
  const int n_inner = MM_SIZE;  // columns of `one` and rows of `two`

  /* Pass 1: clear every cell of the output. */
  int r = 0;
  while (r < n_rows) {
    int c = 0;
    while (c < n_cols) {
      result[r][c] = 0;
      c++;
    }
    r++;
  }

  /* Pass 2: accumulate the dot product of row `row` of `one` with
   * column `col` of `two` directly into the output cell. */
  for (int row = 0; row < n_rows; row++) {
    for (int col = 0; col < n_cols; col++) {
      for (int k = 0; k < n_inner; k++) {
        result[row][col] = result[row][col] + one[row][k] * two[k][col];
      }
    }
  }
}
/*
 * Measures the energy reported by the package (and optionally DRAM) energy
 * MSRs around ITERATIONS_PER_RUN calls to matrix_multiply().
 *
 * cpu_model    - not used by this function.
 * cpu_info     - cpu_info[2] is tested to decide whether the DRAM counter
 *                is read.
 * energy_units - [0] scales the package counter, [1] scales the DRAM counter.
 * r1           - receives package_after - package_before.
 * r2           - receives dram_after - dram_before; written only when
 *                cpu_info[2] is non-zero, otherwise left untouched.
 *
 * Always returns 1.
 */
int measure_msr(int cpu_model, int cpu_info[3], double energy_units[2],
                double *r1, double *r2) {
  int dram_avail = 2;
  int fd;
  long long result;
  double package_before, package_after;
  double dram_before = 0.0, dram_after;

  /*
   * The three matrices live in static storage rather than on the stack.
   * With MM_SIZE defined as L1_SIZE/4 (8192 when L1_SIZE is 32*1024) each
   * matrix holds 8192 * 8192 ints -- about 256 MiB assuming a 4-byte int --
   * which does not fit in a typical process stack. They are refilled on
   * every call, so the values seen by the benchmark are unchanged.
   */
  static int one[MM_SIZE][MM_SIZE];
  static int two[MM_SIZE][MM_SIZE];
  static int res[MM_SIZE][MM_SIZE];

  for (int i = 0; i < MM_SIZE; i++) {
    for (int j = 0; j < MM_SIZE; j++) {
      one[i][j] = i * j;
      two[i][j] = i + j;
    }
  }

  fd = open_msr(0);
  // todo: add package detection + map and stuff

  /* Package Energy */
  result = read_msr(fd, MSR_PKG_ENERGY_STATUS);
  package_before = (double)result * energy_units[0];

  /* Updated documentation (but not the Vol3B) says Haswell and */
  /* Broadwell have DRAM support too                            */
  if (cpu_info[dram_avail]) {
    result = read_msr(fd, MSR_DRAM_ENERGY_STATUS);
    dram_before = (double)result * energy_units[1];
  }

  /* The descriptor is closed while the workload runs and reopened after. */
  close(fd);

  for (int i = 0; i < ITERATIONS_PER_RUN; i++) {
    matrix_multiply(one, two, res);
  }

  fd = open_msr(0);

  result = read_msr(fd, MSR_PKG_ENERGY_STATUS);
  package_after = (double)result * energy_units[0];
  *r1 = package_after - package_before;

  if (cpu_info[dram_avail]) {
    result = read_msr(fd, MSR_DRAM_ENERGY_STATUS);
    dram_after = (double)result * energy_units[1];
    *r2 = dram_after - dram_before;
  }

  close(fd);

  return 1;
}
/*
 * Entry point for the matrix-multiply benchmark: fetches the CPU info and
 * energy units, runs one measurement into slot 0 of the result arrays and
 * prints the package average.
 */
int main(int argc, char *argv[]) {
  int cpu_info[3];         // 0 -> pp0, 1-> pp1, 2-> dram
  double energy_units[2];  // 0 -> cpu, 1 -> dram
  double package_measure[RUNS];
  double dram_measure[RUNS];

  get_cpu_info(CPU_HASWELL_EP, cpu_info, energy_units);

  printf("---------------------------------------\n");

  /* Only the first slot of each result array is filled. */
  measure_msr(CPU_HASWELL_EP, cpu_info, energy_units,
              &package_measure[0], &dram_measure[0]);

  print_avg(package_measure, RUNS);
  // print_avg(dram_measure);

  return 0;
}
benchmarks/tests/msr/msr.h
View file @
3220e838
...
...
@@ -16,14 +16,15 @@
#define RUNS 1
#define ITERATIONS_PER_RUN 1000
#define L1_SIZE
5*
32*1024
#define L2_SIZE
5*
256*1024
#define L1_SIZE 32*1024
#define L2_SIZE 256*1024
#define PAGE_SIZE 4*1024
#define TLB_ASSOC 4
#define TLB_ENTRIES 64
#define L1_LL_SIZE 5*L1_SIZE
#define L2_LL_SIZE
1
*L2_SIZE
#define L1_LL_SIZE
5*
5*L1_SIZE
#define L2_LL_SIZE
5*5
*L2_SIZE
#define TLB_LL_SIZE TLB_ASSOC*TLB_ENTRIES*8*10
#define MM_SIZE L1_SIZE/4
#define MSR_RAPL_POWER_UNIT 0x606
...
...
benchmarks/tests/msr/old_l1_msr.c
0 → 100644
View file @
3220e838
/*
* author: Priyal Suneja ; suneja@cs.washington.edu
*
* to run: sudo ./build/l1_msr
*/
#include
"msr.h"
/*
 * Measures the energy reported by the package (and optionally DRAM) energy
 * MSRs around ITERATIONS_PER_RUN traversals of a linked list built by
 * populate_list(head, L1_LL_SIZE).
 *
 * cpu_model    - not used by this function.
 * cpu_info     - cpu_info[2] is tested to decide whether the DRAM counter
 *                is read.
 * energy_units - [0] scales the package counter, [1] scales the DRAM counter.
 * r1           - receives the package delta.
 * r2           - receives the DRAM delta; written only when cpu_info[2] is
 *                non-zero.
 *
 * Returns whatever populate_list() returned.
 */
int measure_msr(int cpu_model, int cpu_info[3], double energy_units[2],
                double *r1, double *r2) {
  const int dram_slot = 2;  /* index into cpu_info checked before DRAM reads */
  int msr_fd;
  long long raw;
  double pkg_start, pkg_end;
  double dram_start, dram_end;

  /* Build the list that the timed section walks. */
  struct ll *list = malloc(sizeof *list);
  struct ll *node = list;
  int status = populate_list(list, L1_LL_SIZE);

  /* ---- baseline readings ---- */
  msr_fd = open_msr(0);
  // todo: add package detection + map and stuff

  /* Package Energy */
  raw = read_msr(msr_fd, MSR_PKG_ENERGY_STATUS);
  pkg_start = (double)raw * energy_units[0];

  /* Updated documentation (but not the Vol3B) says Haswell and */
  /* Broadwell have DRAM support too                            */
  if (cpu_info[dram_slot] != 0) {
    raw = read_msr(msr_fd, MSR_DRAM_ENERGY_STATUS);
    dram_start = (double)raw * energy_units[1];
  }
  close(msr_fd);

  /* ---- workload: walk the list end to end, then rewind ---- */
  for (int pass = 0; pass < ITERATIONS_PER_RUN; pass++) {
    while (node != NULL) {
      node = node->next;
    }
    node = list;
  }

  /* ---- final readings ---- */
  msr_fd = open_msr(0);

  raw = read_msr(msr_fd, MSR_PKG_ENERGY_STATUS);
  pkg_end = (double)raw * energy_units[0];
  *r1 = pkg_end - pkg_start;

  if (cpu_info[dram_slot] != 0) {
    raw = read_msr(msr_fd, MSR_DRAM_ENERGY_STATUS);
    dram_end = (double)raw * energy_units[1];
    *r2 = dram_end - dram_start;
  }
  close(msr_fd);

  return status;
}
/*
 * Entry point for the old L1 linked-list benchmark: fetches the CPU info
 * and energy units, runs one measurement into slot 0 of the result arrays
 * and prints the package average.
 */
int main(int argc, char *argv[]) {
  int cpu_info[3];         // 0 -> pp0, 1-> pp1, 2-> dram
  double energy_units[2];  // 0 -> cpu, 1 -> dram
  double package_measure[RUNS];
  double dram_measure[RUNS];

  get_cpu_info(CPU_HASWELL_EP, cpu_info, energy_units);

  printf("---------------------------------------\n");

  /* Only the first slot of each result array is filled. */
  measure_msr(CPU_HASWELL_EP, cpu_info, energy_units,
              &package_measure[0], &dram_measure[0]);

  print_avg(package_measure, RUNS);
  // print_avg(dram_measure);

  return 0;
}
benchmarks/tests/msr/old_l2_msr.c
0 → 100644
View file @
3220e838
/*
* author: Priyal Suneja ; suneja@cs.washington.edu
*
* to run: sudo ./build/l2_msr
*/
#include
"msr.h"
/*
 * Measures the energy reported by the package (and optionally DRAM) energy
 * MSRs around ITERATIONS_PER_RUN traversals of a linked list built by
 * populate_list(head, L2_LL_SIZE).
 *
 * cpu_model    - not used by this function.
 * cpu_info     - cpu_info[2] is tested to decide whether the DRAM counter
 *                is read.
 * energy_units - [0] scales the package counter, [1] scales the DRAM counter.
 * r1           - receives the package delta.
 * r2           - receives the DRAM delta; written only when cpu_info[2] is
 *                non-zero.
 *
 * Returns whatever populate_list() returned.
 */
int measure_msr(int cpu_model, int cpu_info[3], double energy_units[2],
                double *r1, double *r2) {
  const int dram_slot = 2;  /* index into cpu_info checked before DRAM reads */
  int msr_fd;
  long long raw;
  double pkg_start, pkg_end;
  double dram_start, dram_end;

  /* Build the list that the timed section walks. */
  struct ll *list = malloc(sizeof *list);
  struct ll *node = list;
  int status = populate_list(list, L2_LL_SIZE);

  /* ---- baseline readings ---- */
  msr_fd = open_msr(0);
  // todo: add package detection + map and stuff

  /* Package Energy */
  raw = read_msr(msr_fd, MSR_PKG_ENERGY_STATUS);
  pkg_start = (double)raw * energy_units[0];

  /* Updated documentation (but not the Vol3B) says Haswell and */
  /* Broadwell have DRAM support too                            */
  if (cpu_info[dram_slot] != 0) {
    raw = read_msr(msr_fd, MSR_DRAM_ENERGY_STATUS);
    dram_start = (double)raw * energy_units[1];
  }
  close(msr_fd);

  /* ---- workload: walk the list end to end, then rewind ---- */
  for (int pass = 0; pass < ITERATIONS_PER_RUN; pass++) {
    while (node != NULL) {
      node = node->next;
    }
    node = list;
  }

  /* ---- final readings ---- */
  msr_fd = open_msr(0);

  raw = read_msr(msr_fd, MSR_PKG_ENERGY_STATUS);
  pkg_end = (double)raw * energy_units[0];
  *r1 = pkg_end - pkg_start;

  if (cpu_info[dram_slot] != 0) {
    raw = read_msr(msr_fd, MSR_DRAM_ENERGY_STATUS);
    dram_end = (double)raw * energy_units[1];
    *r2 = dram_end - dram_start;
  }
  close(msr_fd);

  return status;
}
/*
 * Entry point for the old L2 linked-list benchmark: fetches the CPU info
 * and energy units, runs one measurement into slot 0 of the result arrays
 * and prints the package average.
 */
int main(int argc, char *argv[]) {
  int cpu_info[3];         // 0 -> pp0, 1-> pp1, 2-> dram
  double energy_units[2];  // 0 -> cpu, 1 -> dram
  double package_measure[RUNS];
  double dram_measure[RUNS];

  get_cpu_info(CPU_HASWELL_EP, cpu_info, energy_units);

  printf("---------------------------------------\n");

  // for(int i = 0; i < RUNS; i++) {
  measure_msr(CPU_HASWELL_EP, cpu_info, energy_units,
              &package_measure[0], &dram_measure[0]);
  // }

  print_avg(package_measure, RUNS);
  // print_avg(dram_measure);

  return 0;
}
benchmarks/tests/msr/qs_msr.c
View file @
3220e838
...
...
@@ -24,7 +24,6 @@ int measure_msr(int cpu_model, int cpu_info[3], double energy_units[2],
qs_arr
[
L2_SIZE
-
i
]
=
i
;
}
fd
=
open_msr
(
0
);
// todo: add package detection + map and stuff
/* Package Energy */
...
...
@@ -42,7 +41,7 @@ int measure_msr(int cpu_model, int cpu_info[3], double energy_units[2],
close
(
fd
);
for
(
int
i
=
0
;
i
<
ITERATIONS_PER_RUN
;
i
++
)
{
qsort
(
qs_arr
,
L2_SIZE
,
int
(
qsor
t
),
cmpfnc
);
qsort
(
qs_arr
,
L2_SIZE
,
sizeof
(
in
t
),
cmpf
u
nc
);
}
fd
=
open_msr
(
0
);
...
...
@@ -59,7 +58,8 @@ int measure_msr(int cpu_model, int cpu_info[3], double energy_units[2],
}
close
(
fd
);
return
retval
;
// return retval;
return
1
;
}
...
...
calc.sh
View file @
3220e838
...
...
@@ -43,7 +43,7 @@ then
python3
${
a
[0]
}
/graph_relative_error.py
${
a
[4]
}
/graph_out_one
${
a
[4]
}
/ipc_input
fi
mkdir
${
a
[6]
}
mkdir
${
a
[6]
}
>
/dev/null
mv
${
a
[2]
}
output_table
*
.png
${
a
[6]
}
rm
-rf
${
a
[4]
}
data/bc
View file @
3220e838
********* bc *********
energy consumed: 1
7.105103
energy consumed: 1
8.268188
Performance counter stats for '/homes/sys/suneja/treehouse/single-server-etrace/benchmarks/gapbs/build/bc -g 10 -n 1':
1,
280,013
L1-icache-load-misses (4
0.0
5%)
5,957,208,261
cycles (53.
31
%)
3,906,564,912
cycle_activity.cycles_no_execute (5
4.58
%)
2,
353,367,718
instructions # 0.
40
insn per cycle (6
6.79
%)
1,
118,310
l2_rqsts.miss (6
8
.2
5
%)
3
47,481
dTLB-load-misses (
69.68
%)
2,
119,542
L1-dcache-load-misses (
70.4
9%)
42,203
iTLB-load-misses (5
5.98
%)
1,567
LLC-load-misses (
40.97
%)
1,
398,574
L1-icache-load-misses (4
1.3
5%)
6,190,266,273
cycles (53.
55
%)
4,098,361,581
cycle_activity.cycles_no_execute (5
5.93
%)
2,
444,308,374
instructions # 0.
39
insn per cycle (6
7.62
%)
1,
231,198
l2_rqsts.miss (6
9
.2
2
%)
3
23,928
dTLB-load-misses (
70.94
%)
2,
426,681
L1-dcache-load-misses (
69.7
9%)
35,632
iTLB-load-misses (5
3.40
%)
2,686
LLC-load-misses (
39.36
%)
0.1
73108112
seconds time elapsed
0.1
85722145
seconds time elapsed
data/bfs
View file @
3220e838
********* bfs *********
energy consumed: 12.
4
921
26
energy consumed: 12.
518
921
Performance counter stats for '/homes/sys/suneja/treehouse/single-server-etrace/benchmarks/gapbs/build/bfs -g 10 -n 1':
1,
108,723
L1-icache-load-misses (38.5
8
%)
4,
256,090,06
4 cycles (5
1.79
%)
2,8
20,788,119
cycle_activity.cycles_no_execute (5
5
.0
6
%)
1,
699,870,430
instructions # 0.40 insn per cycle (66.
50
%)
973,942
l2_rqsts.miss (
70.49
%)
2
25,176
dTLB-load-misses (
72.08
%)
1,
691,443
L1-dcache-load-misses (71.
50
%)
34,146
iTLB-load-misses (5
3
.3
7
%)
88
9 LLC-load-misses (
38.93
%)
1,
071,280
L1-icache-load-misses (38.
6
5%)
4,
307,324,59
4 cycles (5
0.40
%)
2,8
68,864,012
cycle_activity.cycles_no_execute (5
4
.0
8
%)
1,
713,426,262
instructions # 0.40 insn per cycle (66.
44
%)
1,043,593
l2_rqsts.miss (
67.20
%)
2
36,834
dTLB-load-misses (
69.27
%)
1,
838,491
L1-dcache-load-misses (71.
62
%)
25,868
iTLB-load-misses (5
6
.3
0
%)
2,64
9 LLC-load-misses (
42.88
%)
0.127
0
26
5
23 seconds time elapsed
0.12
8
72623
4
seconds time elapsed
data/cc
View file @
3220e838
********* cc *********
energy consumed: 11.
870361
energy consumed: 11.
676025
Performance counter stats for '/homes/sys/suneja/treehouse/single-server-etrace/benchmarks/gapbs/build/cc -g 10 -n 1':
1,0
52,401
L1-icache-load-misses (38.
78
%)
4,01
0,943,992
cycles (
51
.8
3
%)
2,64
2,775,05
2 cycle_activity.cycles_no_execute (5
5.34
%)
1,
604,789,365
instructions # 0.40 insn per cycle (6
8.06
%)
769,580
l2_rqsts.miss (6
9.25
%)
1
83,421
dTLB-load-misses (
70.36
%)
1,5
69,755
L1-dcache-load-misses (7
1.51
%)
2
7,965
iTLB-load-misses (5
4
.3
4
%)
621
LLC-load-misses (4
0.43
%)
1,0
49,290
L1-icache-load-misses (38.
22
%)
4,01
8,704,957
cycles (
49
.8
4
%)
2,64
9,330,69
2 cycle_activity.cycles_no_execute (5
1.75
%)
1,
597,239,477
instructions # 0.40 insn per cycle (6
3.41
%)
912,903
l2_rqsts.miss (6
5.80
%)
1
45,763
dTLB-load-misses (
69.54
%)
1,5
50,234
L1-dcache-load-misses (7
4.39
%)
2
1,449
iTLB-load-misses (5
7
.3
2
%)
389
LLC-load-misses (4
2.98
%)
0.121
917271
seconds time elapsed
0.121
783479
seconds time elapsed
data/cc_sv
View file @
3220e838
********* cc_sv *********
energy consumed: 1
2.25921
6
energy consumed: 1
1.39776
6
Performance counter stats for '/homes/sys/suneja/treehouse/single-server-etrace/benchmarks/gapbs/build/cc_sv -g 10 -n 1':
1,0
72,745
L1-icache-load-misses (
38.1
9%)
4,082,037,613
cycles (5
0.62
%)
2,
674,615,1
41 cycle_activity.cycles_no_execute (53.
20
%)
1,63
0,538,924
instructions # 0.40 insn per cycle (6
5.65
%)
910,821
l2_rqsts.miss (6
9.1
3%)
17
9,548
dTLB-load-misses (
72.39
%)
1,
526,14
4 L1-dcache-load-misses (71.
92
%)
23,7
77
iTLB-load-misses (5
5.82
%)
1,334
LLC-load-misses (
39.35
%)
1,0
88,443
L1-icache-load-misses (
40.3
9%)
3,921,869,128
cycles (5
3.09
%)
2,
581,254,
41
3
cycle_activity.cycles_no_execute (53.
35
%)
1,
5
63
,640,369
instructions # 0.40 insn per cycle (6
6.49
%)
889,677
l2_rqsts.miss (6
8.0
3%)
17
6,630
dTLB-load-misses (
68.23
%)
1,
635,70
4 L1-dcache-load-misses (71.
85
%)
23,7
25
iTLB-load-misses (5
6.33
%)
471
LLC-load-misses (
41.82
%)
0.1
25100855
seconds time elapsed
0.1
16843799
seconds time elapsed
data/err_bfs_10
View file @
3220e838
********* graph500 *********
energy consumed:
5306.928711
energy consumed:
9446.554016
Performance counter stats for 'mpirun --allow-run-as-root --mca orte_base_help_aggregate 0 /homes/sys/suneja/treehouse/single-server-etrace/benchmarks/graph500/build/err_bfs 10':
57,505,330
L1-icache-load-misses (44.4
7
%)
1,
066,815,891,182
cycles (55.5
8
%)
525,134,753,42
5 cycle_activity.cycles_no_execute (55.5
6
%)
867,362,244,260
instructions # 0.8
1
insn per cycle (66.66%)
6
2,
625,29
7 l2_rqsts.miss (66.6
4
%)
3,464,834
dTLB-load-misses (66.6
4
%)
141,176,835
L1-dcache-load-misses (66.6
6
%)
2,595,349
iTLB-load-misses (55.56%)
663,912
LLC-load-misses (44.4
7
%)
84,386,768
L1-icache-load-misses (44.4
4
%)
1,
903,679,492,119
cycles (55.5
5
%)
941,000,533,58
5 cycle_activity.cycles_no_execute (55.5
5
%)
1,526,777,735,404
instructions # 0.8
0
insn per cycle (66.66%)
8
2,
773,03
7 l2_rqsts.miss (66.6
6
%)
6,097,256
dTLB-load-misses (66.6
7
%)
231,543,598
L1-dcache-load-misses (66.6
7
%)
4,953,584
iTLB-load-misses (55.56%)
700,451
LLC-load-misses (44.4
4
%)
5
1.
242779
15
6
seconds time elapsed
9
1.
182001
15
9
seconds time elapsed
data/err_bfs_5
View file @
3220e838
********* graph500 *********
energy consumed:
2396.366150
energy consumed:
1210.031494
Performance counter stats for 'mpirun --allow-run-as-root --mca orte_base_help_aggregate 0 /homes/sys/suneja/treehouse/single-server-etrace/benchmarks/graph500/build/err_bfs 5':
2
7,875,712
L1-icache-load-misses (44.
4
0%)
484,571,530,485
cycles (55.
50
%)
242,228,828,226
cycle_activity.cycles_no_execute (55.52%)
376,769,298,968
instructions # 0.7
8
insn per cycle (66.6
6
%)
40,247,386
l2_rqsts.miss (66.6
7
%)
2,
317,000
dTLB-load-misses (66.
6
9%)
90,245,854
L1-dcache-load-misses (66.
70
%)
1,
513,399
iTLB-load-misses (55.
59
%)
576,917
LLC-load-misses (44.
43
%)
2
2,279,424
L1-icache-load-misses (44.
5
0%)
247,684,672,026
cycles (55.
61
%)
126,604,996,271
cycle_activity.cycles_no_execute (55.52%)
178,710,216,603
instructions # 0.7
2
insn per cycle (66.6
0
%)
29,491,315
l2_rqsts.miss (66.6
0
%)
2,
250,612
dTLB-load-misses (66.
5
9%)
52,137,220
L1-dcache-load-misses (66.
66
%)
1,
453,774
iTLB-load-misses (55.
62
%)
609,794
LLC-load-misses (44.
52
%)
23.504193532
seconds time elapsed
12.276787029
seconds time elapsed
data/err_bfs_7
View file @
3220e838
********* graph500 *********
energy consumed:
3501.399292
energy consumed:
7163.584167