Skip to content

Commit b3d9838

Browse files
abhaumick, JRPan, mkhairy, tgrogers
authored
Small changes for compatibility, added Atomics uBench app groups (#106)
* Update latency config
* Added app groups for atomic benchmarking
  - Collection of GPU Atomic uBench
  - Additional app groups for profiling
* Changes to allow python2 compatibility
  - `from __future__ import print_function`
* Fixes to run_simulations.py
  - added arguments passed to command in justrun file
  - pipes out console output to a text file

---------

Co-authored-by: JRPAN <[email protected]>
Co-authored-by: mkhairy <[email protected]>
Co-authored-by: Tim Rogers <[email protected]>
1 parent d21201f commit b3d9838

File tree

3 files changed

+228
-4
lines changed

3 files changed

+228
-4
lines changed

util/hw_stats/run_hw.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@
2929
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
3030
# POSSIBILITY OF SUCH DAMAGE.
3131

32-
32+
from __future__ import print_function
3333
from optparse import OptionParser
3434
import os
3535
import subprocess
@@ -206,7 +206,9 @@
206206
+ cuda_version
207207
+ '"; export CUDA_VISIBLE_DEVICES="'
208208
+ options.device_num
209-
+ '" ; timeout 30m nvprof --concurrent-kernels off --print-gpu-trace -u us --metrics all --demangling off --csv --log-file '
209+
+ '" ; timeout 30m nvprof --concurrent-kernels off --print-gpu-trace -u us --metrics all,'
210+
+ 'atomic_throughput,atomic_transactions,atomic_transactions_per_request,l2_atomic_throughput,l2_atomic_transactions,global_atomic_requests '
211+
+ '--demangling off --csv --log-file '
210212
+ os.path.join(this_run_dir, logfile)
211213
+ " "
212214
+ exec_path

util/job_launching/apps/define-all-apps.yml

Lines changed: 221 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -112,6 +112,227 @@ GPU_Microbenchmark:
112112
- args:
113113
accel-sim-mem: 1G
114114

115+
GPU_Atomic:
116+
exec_dir: "$GPUAPPS_ROOT/bin/$CUDA_VERSION/release/"
117+
data_dirs: "$GPUAPPS_ROOT/data_dirs/"
118+
execs:
119+
- atomic_add_bw:
120+
- args:
121+
accel-sim-mem: 1G
122+
- atomic_add_bw_conflict:
123+
- args:
124+
accel-sim-mem: 1G
125+
- atomic_add_bw_profile:
126+
- args: 16
127+
accel-sim-mem: 1G
128+
- atomic_add_bw_diverge:
129+
- args: 16
130+
accel-sim-mem: 1G
131+
132+
Atomic_Profile:
133+
exec_dir: "$GPUAPPS_ROOT/bin/$CUDA_VERSION/release/"
134+
data_dirs: "$GPUAPPS_ROOT/data_dirs/"
135+
execs:
136+
- atomic_add_bw_profile:
137+
- args: 32
138+
accel-sim-mem: 1G
139+
- atomic_add_bw_profile:
140+
- args: 31
141+
accel-sim-mem: 1G
142+
- atomic_add_bw_profile:
143+
- args: 30
144+
accel-sim-mem: 1G
145+
- atomic_add_bw_profile:
146+
- args: 29
147+
accel-sim-mem: 1G
148+
- atomic_add_bw_profile:
149+
- args: 28
150+
accel-sim-mem: 1G
151+
- atomic_add_bw_profile:
152+
- args: 27
153+
accel-sim-mem: 1G
154+
- atomic_add_bw_profile:
155+
- args: 26
156+
accel-sim-mem: 1G
157+
- atomic_add_bw_profile:
158+
- args: 25
159+
accel-sim-mem: 1G
160+
- atomic_add_bw_profile:
161+
- args: 24
162+
accel-sim-mem: 1G
163+
- atomic_add_bw_profile:
164+
- args: 23
165+
accel-sim-mem: 1G
166+
- atomic_add_bw_profile:
167+
- args: 22
168+
accel-sim-mem: 1G
169+
- atomic_add_bw_profile:
170+
- args: 21
171+
accel-sim-mem: 1G
172+
- atomic_add_bw_profile:
173+
- args: 20
174+
accel-sim-mem: 1G
175+
- atomic_add_bw_profile:
176+
- args: 19
177+
accel-sim-mem: 1G
178+
- atomic_add_bw_profile:
179+
- args: 18
180+
accel-sim-mem: 1G
181+
- atomic_add_bw_profile:
182+
- args: 17
183+
accel-sim-mem: 1G
184+
- atomic_add_bw_profile:
185+
- args: 16
186+
accel-sim-mem: 1G
187+
- atomic_add_bw_profile:
188+
- args: 15
189+
accel-sim-mem: 1G
190+
- atomic_add_bw_profile:
191+
- args: 14
192+
accel-sim-mem: 1G
193+
- atomic_add_bw_profile:
194+
- args: 13
195+
accel-sim-mem: 1G
196+
- atomic_add_bw_profile:
197+
- args: 12
198+
accel-sim-mem: 1G
199+
- atomic_add_bw_profile:
200+
- args: 11
201+
accel-sim-mem: 1G
202+
- atomic_add_bw_profile:
203+
- args: 10
204+
accel-sim-mem: 1G
205+
- atomic_add_bw_profile:
206+
- args: 9
207+
accel-sim-mem: 1G
208+
- atomic_add_bw_profile:
209+
- args: 8
210+
accel-sim-mem: 1G
211+
- atomic_add_bw_profile:
212+
- args: 7
213+
accel-sim-mem: 1G
214+
- atomic_add_bw_profile:
215+
- args: 6
216+
accel-sim-mem: 1G
217+
- atomic_add_bw_profile:
218+
- args: 5
219+
accel-sim-mem: 1G
220+
- atomic_add_bw_profile:
221+
- args: 4
222+
accel-sim-mem: 1G
223+
- atomic_add_bw_profile:
224+
- args: 3
225+
accel-sim-mem: 1G
226+
- atomic_add_bw_profile:
227+
- args: 2
228+
accel-sim-mem: 1G
229+
- atomic_add_bw_profile:
230+
- args: 1
231+
accel-sim-mem: 1G
232+
233+
Atomic_Diverge:
234+
exec_dir: "$GPUAPPS_ROOT/bin/$CUDA_VERSION/release/"
235+
data_dirs: "$GPUAPPS_ROOT/data_dirs/"
236+
execs:
237+
- atomic_add_bw_diverge:
238+
- args: 32
239+
accel-sim-mem: 1G
240+
- atomic_add_bw_diverge:
241+
- args: 31
242+
accel-sim-mem: 1G
243+
- atomic_add_bw_diverge:
244+
- args: 30
245+
accel-sim-mem: 1G
246+
- atomic_add_bw_diverge:
247+
- args: 29
248+
accel-sim-mem: 1G
249+
- atomic_add_bw_diverge:
250+
- args: 28
251+
accel-sim-mem: 1G
252+
- atomic_add_bw_diverge:
253+
- args: 27
254+
accel-sim-mem: 1G
255+
- atomic_add_bw_diverge:
256+
- args: 26
257+
accel-sim-mem: 1G
258+
- atomic_add_bw_diverge:
259+
- args: 25
260+
accel-sim-mem: 1G
261+
- atomic_add_bw_diverge:
262+
- args: 24
263+
accel-sim-mem: 1G
264+
- atomic_add_bw_diverge:
265+
- args: 23
266+
accel-sim-mem: 1G
267+
- atomic_add_bw_diverge:
268+
- args: 22
269+
accel-sim-mem: 1G
270+
- atomic_add_bw_diverge:
271+
- args: 21
272+
accel-sim-mem: 1G
273+
- atomic_add_bw_diverge:
274+
- args: 20
275+
accel-sim-mem: 1G
276+
- atomic_add_bw_diverge:
277+
- args: 19
278+
accel-sim-mem: 1G
279+
- atomic_add_bw_diverge:
280+
- args: 18
281+
accel-sim-mem: 1G
282+
- atomic_add_bw_diverge:
283+
- args: 17
284+
accel-sim-mem: 1G
285+
- atomic_add_bw_diverge:
286+
- args: 16
287+
accel-sim-mem: 1G
288+
- atomic_add_bw_diverge:
289+
- args: 15
290+
accel-sim-mem: 1G
291+
- atomic_add_bw_diverge:
292+
- args: 14
293+
accel-sim-mem: 1G
294+
- atomic_add_bw_diverge:
295+
- args: 13
296+
accel-sim-mem: 1G
297+
- atomic_add_bw_diverge:
298+
- args: 12
299+
accel-sim-mem: 1G
300+
- atomic_add_bw_diverge:
301+
- args: 11
302+
accel-sim-mem: 1G
303+
- atomic_add_bw_diverge:
304+
- args: 10
305+
accel-sim-mem: 1G
306+
- atomic_add_bw_diverge:
307+
- args: 9
308+
accel-sim-mem: 1G
309+
- atomic_add_bw_diverge:
310+
- args: 8
311+
accel-sim-mem: 1G
312+
- atomic_add_bw_diverge:
313+
- args: 7
314+
accel-sim-mem: 1G
315+
- atomic_add_bw_diverge:
316+
- args: 6
317+
accel-sim-mem: 1G
318+
- atomic_add_bw_diverge:
319+
- args: 5
320+
accel-sim-mem: 1G
321+
- atomic_add_bw_diverge:
322+
- args: 4
323+
accel-sim-mem: 1G
324+
- atomic_add_bw_diverge:
325+
- args: 3
326+
accel-sim-mem: 1G
327+
- atomic_add_bw_diverge:
328+
- args: 2
329+
accel-sim-mem: 1G
330+
- atomic_add_bw_diverge:
331+
- args: 1
332+
accel-sim-mem: 1G
333+
334+
335+
115336
Deepbench_nvidia_tencore:
116337
exec_dir: "$GPUAPPS_ROOT/bin/$CUDA_VERSION/release/"
117338
data_dirs: "$GPUAPPS_ROOT/data_dirs/"

util/job_launching/run_simulations.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -377,8 +377,9 @@ def text_replace_torque_sim(
377377
)
378378
open(os.path.join(this_run_dir, job_template), "w").write(torque_text)
379379
exec_line = torque_text.splitlines()[-1]
380-
justrunfile = os.path.join(this_run_dir, "justrun.sh")
381-
open(justrunfile, "w").write(exec_name + " " + txt_args + "\n")
380+
justrunfile = os.path.join(this_run_dir , "justrun.sh")
381+
# open(justrunfile, 'w').write(exec_name + " " + txt_args + "\n")
382+
open(justrunfile, 'w').write(exec_name + " " + txt_args + " | tee gpgpu-sim-out_`date '+%b_%d_%H:%M.%S'`.txt")
382383
os.chmod(justrunfile, 0o744)
383384

384385
# replaces all the "REPLACE_*" strings in the gpgpusim.config file

0 commit comments

Comments
 (0)