-
Notifications
You must be signed in to change notification settings - Fork 32
/
Copy pathbandwidth.c
executable file
·236 lines (211 loc) · 6.16 KB
/
bandwidth.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
/**
*
* Copyright (C) 2012 Heechul Yun <[email protected]>
* 2012 Zheng <[email protected]>
*
* This file is distributed under the University of Illinois Open Source
* License. See LICENSE.TXT for details.
*
*/
/* clang -S -mllvm --x86-asm-syntax=intel ./bandwidth.c */
/**************************************************************************
* Conditional Compilation Options
**************************************************************************/
/**************************************************************************
* Included Files
**************************************************************************/
#define _GNU_SOURCE /* See feature_test_macros(7) */
#include <sched.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <signal.h>
#include <unistd.h>
#include <inttypes.h>
#include <limits.h>
#include <sys/mman.h>
#include <sys/types.h>
#include <fcntl.h>
#include <errno.h>
#include <sys/time.h>
#include <sys/resource.h>
/**************************************************************************
* Public Definitions
**************************************************************************/
/* Distance in bytes between two consecutive benchmark accesses. */
#define CACHE_LINE_SIZE 64

/* Default buffer size in KB; a smaller buffer is used when __arm__ is defined. */
#if defined(__arm__)
#define DEFAULT_ALLOC_SIZE_KB 4096
#else
#define DEFAULT_ALLOC_SIZE_KB 16384
#endif

/**************************************************************************
 * Public Types
 **************************************************************************/

/* Kind of memory access performed by the benchmark loop. */
enum access_type {
	READ,
	WRITE
};

/**************************************************************************
 * Global Variables
 **************************************************************************/

/* Size of the benchmark buffer in bytes. */
int g_mem_size = DEFAULT_ALLOC_SIZE_KB * 1024;

/* Start of the benchmark buffer; null until it has been allocated. */
int *g_mem_ptr = NULL;

/* Running byte count, advanced by g_mem_size per read or write pass. */
volatile uint64_t g_nread = 0;

/* get_usecs() sample taken just before the benchmark loop starts. */
volatile unsigned int g_start;

/* CPU number requested on the command line (reported in the output). */
int cpuid = 0;
/**************************************************************************
* Public Functions
**************************************************************************/
/**
 * Sample the wall clock in microseconds, truncated to unsigned int.
 *
 * The result wraps around modulo UINT_MAX + 1 (roughly every 71.6 minutes
 * when unsigned int is 32 bits), so it is only meaningful as the unsigned
 * difference of two samples taken less than one wrap period apart.
 *
 * The arithmetic is carried out in unsigned int on purpose: multiplying
 * tv_sec by 1000000 in a signed 32-bit time_t would overflow, which is
 * undefined behaviour, whereas unsigned wrap-around is well defined and
 * yields the same truncated value.
 *
 * NOTE(review): gettimeofday() reports wall-clock time, which can jump if
 * the system clock is adjusted while a measurement is in progress.
 *
 * @return microseconds since the Epoch modulo UINT_MAX + 1, or 0 in the
 *         unlikely event that gettimeofday() fails.
 */
unsigned int get_usecs(void)
{
	struct timeval now = { 0, 0 };

	gettimeofday(&now, NULL);
	return (unsigned int)now.tv_sec * 1000000u + (unsigned int)now.tv_usec;
}
/**
 * Print the benchmark summary and terminate the process with status 0.
 *
 * Reports the accumulated byte count (g_nread), the time elapsed since
 * g_start, the resulting bandwidth in MB/s and the average time per
 * CACHE_LINE_SIZE-byte access in nanoseconds.
 *
 * The computation uses double rather than float: a float holds integers
 * exactly only up to 2^24, which is exceeded both by microsecond counts of
 * runs longer than ~16 seconds and by typical byte counts. The bandwidth
 * and the average are reported as 0 when the elapsed time or the number of
 * accessed lines is zero, instead of dividing by zero.
 *
 * NOTE(review): main() installs this function as the SIGINT/SIGALRM
 * handler, but printf() and exit() are not async-signal-safe. Making that
 * strictly conforming requires a flag-based shutdown coordinated with the
 * benchmark loop, so it is flagged here rather than changed.
 *
 * @param param signal number when invoked as a handler; unused.
 */
void quit(int param)
{
	/* Unsigned subtraction stays correct across a get_usecs() wrap. */
	unsigned int elapsed_usec = get_usecs() - g_start;
	/* Read the volatile counter once so every printed figure agrees. */
	uint64_t bytes = g_nread;
	uint64_t lines = bytes / CACHE_LINE_SIZE;
	double dur = (double)elapsed_usec;
	double dur_in_sec = dur / 1000000.0;
	double bw = 0.0;
	double avg_ns = 0.0;

	(void)param;

	if (dur_in_sec > 0.0)
		bw = (double)bytes / dur_in_sec / 1024 / 1024;
	if (lines > 0)
		avg_ns = (dur * 1000.0) / (double)lines;

	printf("g_nread(bytes read) = %" PRIu64 "\n", bytes);
	printf("elapsed = %.2f sec ( %.0f usec )\n", dur_in_sec, dur);
	printf("CPU%d: B/W = %.2f MB/s | ", cpuid, bw);
	printf("CPU%d: average = %.2f ns\n", cpuid, avg_ns);
	exit(0);
}
/**
 * Run one read pass over the benchmark buffer.
 *
 * Loads one int out of every CACHE_LINE_SIZE bytes of g_mem_ptr (indices
 * are computed assuming a 4-byte int) and accumulates the loaded values.
 * After the pass, g_nread is advanced by the full buffer size g_mem_size.
 *
 * @return the sum of the values that were loaded.
 */
int64_t bench_read()
{
	int64_t total = 0;
	int idx = 0;

	while (idx < g_mem_size / 4) {
		total += g_mem_ptr[idx];
		idx += CACHE_LINE_SIZE / 4;	/* step to the next cache line */
	}

	g_nread += g_mem_size;
	return total;
}
/**
 * Run one write pass over the benchmark buffer.
 *
 * Stores to one int out of every CACHE_LINE_SIZE bytes of g_mem_ptr
 * (indices are computed assuming a 4-byte int); the stored value is the
 * element's own index. After the pass, g_nread is advanced by the full
 * buffer size g_mem_size.
 *
 * @return always 1.
 */
int bench_write()
{
	int pos;

	pos = 0;
	while (pos < g_mem_size / 4) {
		g_mem_ptr[pos] = pos;
		pos += (CACHE_LINE_SIZE / 4);	/* one store per cache line */
	}

	g_nread += g_mem_size;
	return 1;
}
/**
 * Print the command-line help to stdout and exit with status 1.
 *
 * The text is kept in line with what main() actually does: the -m default
 * mirrors DEFAULT_ALLOC_SIZE_KB (keep the two in sync), -r is listed, and
 * the options that main() accepts but does not act on (-n, -l, -f) are
 * marked as ignored.
 *
 * @param argc argument count; unused, kept for interface compatibility.
 * @param argv argument vector; argv[0] is printed as the program name.
 */
void usage(int argc, char *argv[])
{
	(void)argc;

	printf("Usage: $ %s [<option>]*\n\n", argv[0]);
#ifdef __arm__
	printf("-m: memory size in KB. default=4096\n");
#else
	printf("-m: memory size in KB. default=16384\n");
#endif
	printf("-a: access type - read, write. default=read\n");
	printf("-n: addressing pattern - Seq, Row, Bank. default=Seq (currently ignored)\n");
	printf("-t: time to run in sec. 0 means indefinite. default=5. \n");
	printf("-c: CPU to run.\n");
	printf("-i: iterations. 0 means indefinite. default=0\n");
	printf("-p: priority (nice value)\n");
	printf("-r: real-time priority (SCHED_FIFO)\n");
	printf("-l: log label. use together with -f (currently ignored)\n");
	printf("-f: log file name (currently ignored)\n");
	printf("-h: help\n");
	printf("\nExamples: \n$ bandwidth -m 8192 -a read -t 1 -c 2\n <- 8MB read for 1 second on CPU 2\n");
	exit(1);
}
/**
 * Parse the argument of a numeric command-line option.
 *
 * Accepts the same decimal/octal/hex syntax as strtol() with base 0, but
 * rejects empty input, trailing characters and values outside [min, max].
 * On rejection an error naming the option is printed to stderr and the
 * process exits with status 1.
 *
 * @param opt  option letter, used only in the error message.
 * @param text option argument to convert.
 * @param min  smallest accepted value.
 * @param max  largest accepted value.
 * @return the converted value.
 */
static int parse_int_opt(int opt, const char *text, int min, int max)
{
	char *end = NULL;
	long value;

	errno = 0;
	value = strtol(text, &end, 0);
	if (end == text || *end != '\0' || errno == ERANGE ||
	    value < min || value > max) {
		fprintf(stderr, "invalid value '%s' for option -%c\n", text, opt);
		exit(1);
	}
	return (int)value;
}

/**
 * Entry point: parse options, allocate and initialise the buffer, then run
 * read or write passes until the time limit or iteration count is reached.
 *
 * Options handled: -m (buffer size in KB), -a (read|write), -t (seconds,
 * 0 = no time limit), -c (CPU affinity), -r (SCHED_FIFO priority),
 * -p (setpriority() value), -i (number of passes, 0 = unbounded), -h.
 * The options -n, -f, -l and -x are accepted but have no effect.
 *
 * The run ends through quit(), either from the SIGINT/SIGALRM handler or
 * after the requested number of passes, so this function does not return
 * normally.
 *
 * @return 0 (not reached in practice because quit() exits the process).
 */
int main(int argc, char *argv[])
{
	int64_t sum = 0;
	unsigned finish = 5;
	int prio = 0;
	long num_processors;
	int acc_type = READ;
	int opt;
	cpu_set_t cmask;
	int iterations = 0;
	int completed = 0;
	size_t n_words;
	size_t w;
	struct sched_param param;

	/*
	 * get command line options
	 */
	while ((opt = getopt(argc, argv, "m:a:n:t:c:i:p:r:f:l:xh")) != -1) {
		switch (opt) {
		case 'm': /* set memory size */
			/* Bounded so that the size in bytes still fits in an int. */
			g_mem_size = 1024 * parse_int_opt(opt, optarg, 1, INT_MAX / 1024);
			break;
		case 'a': /* set access type */
			if (!strcmp(optarg, "read")) {
				acc_type = READ;
			} else if (!strcmp(optarg, "write")) {
				acc_type = WRITE;
			} else {
				fprintf(stderr, "invalid access type '%s' (expected read or write)\n",
					optarg);
				exit(1);
			}
			break;
		case 't': /* set time in secs to run */
			finish = (unsigned)parse_int_opt(opt, optarg, 0, INT_MAX);
			break;
		case 'c': /* set CPU affinity */
			cpuid = parse_int_opt(opt, optarg, 0, INT_MAX);
			num_processors = sysconf(_SC_NPROCESSORS_CONF);
			if (num_processors < 1) {
				fprintf(stderr, "cannot determine number of processors\n");
				break;
			}
			CPU_ZERO(&cmask);
			/* CPU ids beyond the configured count wrap around. */
			CPU_SET((int)(cpuid % num_processors), &cmask);
			/* The second argument is the mask size in bytes, not a CPU count. */
			if (sched_setaffinity(0, sizeof(cmask), &cmask) < 0)
				perror("error");
			else
				fprintf(stderr, "assigned to cpu %d\n", cpuid);
			break;
		case 'r': /* set real-time (SCHED_FIFO) priority */
			prio = parse_int_opt(opt, optarg, INT_MIN, INT_MAX);
			memset(&param, 0, sizeof(param));
			param.sched_priority = prio; /* 1(low)- 99(high) for SCHED_FIFO or SCHED_RR
							0 for SCHED_OTHER or SCHED_BATCH */
			if (sched_setscheduler(0, SCHED_FIFO, &param) == -1) {
				perror("sched_setscheduler failed");
			}
			break;
		case 'p': /* set priority */
			prio = parse_int_opt(opt, optarg, INT_MIN, INT_MAX);
			if (setpriority(PRIO_PROCESS, 0, prio) < 0)
				perror("error");
			else
				fprintf(stderr, "assigned priority %d\n", prio);
			break;
		case 'i': /* iterations */
			iterations = parse_int_opt(opt, optarg, 0, INT_MAX);
			break;
		case 'h':
			usage(argc, argv);
			break;
		case 'n':
		case 'f':
		case 'l':
		case 'x':
			/* Accepted for command-line compatibility; no effect. */
			break;
		default:
			/* Unknown option: getopt() has already printed a diagnostic. */
			break;
		}
	}

	/*
	 * allocate contiguous region of memory
	 */
	g_mem_ptr = malloc((size_t)g_mem_size);
	if (g_mem_ptr == NULL) {
		perror("malloc");
		exit(1);
	}
	memset(g_mem_ptr, 1, (size_t)g_mem_size);
	n_words = (size_t)g_mem_size / sizeof(int);
	for (w = 0; w < n_words; w++)
		g_mem_ptr[w] = (int)w;

	/* print experiment info before starting */
	printf("memsize=%d KB, type=%s, cpuid=%d\n",
	       g_mem_size / 1024,
	       ((acc_type == READ) ? "read" : "write"),
	       cpuid);
	printf("stop at %u\n", finish);

	/* set signals to terminate once time has been reached */
	signal(SIGINT, &quit);
	if (finish > 0) {
		signal(SIGALRM, &quit);
		alarm(finish);
	}

	/*
	 * actual memory access
	 */
	g_start = get_usecs();
	for (;;) {
		switch (acc_type) {
		case WRITE:
			sum += bench_write();
			break;
		case READ:
		default:
			sum += bench_read();
			break;
		}
		/*
		 * Count passes only when a limit was requested, so an unbounded
		 * run can never overflow the counter, and stop after exactly
		 * 'iterations' passes.
		 */
		if (iterations > 0 && ++completed >= iterations)
			break;
	}
	printf("total sum = %" PRId64 "\n", sum);
	quit(0);
	return 0;
}