-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathcommand
More file actions
81 lines (42 loc) · 2.67 KB
/
Copy pathcommand
File metadata and controls
81 lines (42 loc) · 2.67 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
# --- hw3 runs ---------------------------------------------------------------
# Every job below asks Slurm for one task; all but the deviceQuery job also
# pin it to one node.
# Program arguments are: <input testcase> <output file>.

# hw3-2 on the nvidia partition with a single GPU, one job per testcase.
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw3-2 /home/pp25/pp25s051/share/hw3/testcases/c20.1 ./outc20.1
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw3-2 /home/pp25/pp25s051/share/hw3/testcases/p11k1 ./p11k1
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw3-2 /home/pp25/pp25s051/share/hw3/testcases/p15k1 ./p15k1
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw3-2 /home/pp25/pp25s051/share/hw3/testcases/p20k1 ./p20k1
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw3-2 /home/pp25/pp25s051/share/hw3/testcases/p25k1 ./p25k1

# hw3-3 requests two GPUs on the same node.
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:2 \
  ./hw3-3 /home/pp25/pp25s051/share/hw3/testcases/p33k1 ./outp33k1

# deviceQuery with one GPU allocated (no partition given, so the cluster
# default applies).
srun --ntasks=1 --gres=gpu:1 /home/pp25/pp25s051/deviceQuery/deviceQuery

# hw3-1 requests no GPU resource.
srun --nodes=1 --ntasks=1 \
  ./hw3-1 /home/pp25/pp25s051/share/hw3/testcases/c21.1 ./outc21.1

# hw3-2 again on c20.1 (same command as the first one in this group).
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw3-2 /home/pp25/pp25s051/share/hw3/testcases/c20.1 ./outc20.1

# hw3-2-amd on the amd partition: a plain run, then the same run under
# rocprof --stats.
srun --partition=amd --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw3-2-amd /home/pp25/pp25s051/share/hw3/testcases/c21.1 ./outc21.1
srun --partition=amd --nodes=1 --ntasks=1 --gres=gpu:1 \
  rocprof --stats ./hw3-2-amd /home/pp25/pp25s051/share/hw3/testcases/c21.1 ./outc21.1
# Profile hw3-2-amd on testcase c21.1 under rocprof --stats, writing the
# profiler output to the CSV named by -o.
#
# The executable must appear exactly once after the rocprof options. A second
# "./hw3-2-amd" shifts the program's arguments, so the binary itself is passed
# as the input file and the testcase path is passed as the output file.
#
# NOTE(review): "bsz64"/"bsz32" presumably label the block size the binary was
# built with -- confirm, and rebuild between runs if so.
srun -p amd -N1 -n1 --gres=gpu:1 \
  rocprof --stats -o stats_bsz64.csv \
  ./hw3-2-amd /home/pp25/pp25s051/share/hw3/testcases/c21.1 ./outc21.1
srun -p amd -N1 -n1 --gres=gpu:1 \
  rocprof --stats -o stats_bsz32.csv \
  ./hw3-2-amd /home/pp25/pp25s051/share/hw3/testcases/c21.1 ./outc21.1
# This run reuses the stats_bsz64.csv name from the first command above, so
# it overwrites that file.
srun -p amd -N1 -n1 --gres=gpu:1 \
  rocprof --stats -o stats_bsz64.csv \
  ./hw3-2-amd /home/pp25/pp25s051/share/hw3/testcases/c21.1 ./outc21.1
# Plain (unprofiled) runs on the amd partition, one GPU each.
# hw3-2-amd on testcase p26k1; output goes to ./p26k1 in the working directory.
srun --partition=amd --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw3-2-amd /home/pp25/pp25s051/share/hw3/testcases/p26k1 p26k1
# hw4-amd on testcase t01 from the testcases-amd directory; output goes to "out".
srun --partition=amd --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw4-amd /home/pp25/pp25s051/share/hw4/testcases-amd/t01 out
# Collect the gld_throughput metric for hw4 on testcase t25 with nvprof.
#
# This must be a single command: nvprof needs the program to profile on its
# own command line, and a testcase path on a line by itself would be executed
# by the shell as if it were a program.
#
# NOTE(review): the executable (./hw4) and output name (t25.out) are taken
# from the other hw4 nvprof commands in this file -- confirm they are what
# was intended here.
srun -p nvidia -N1 -n1 --gres=gpu:1 \
  nvprof --metrics gld_throughput \
  ./hw4 /home/pp25/pp25s051/share/hw4/testcases/t25 t25.out
# hw4 on the nvidia partition, testcase t25, output written to t25.out.
# First under nvprof with a comma-separated metric list, then unprofiled.
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:1 \
  nvprof \
  --metrics achieved_occupancy,sm_efficiency,shared_load_throughput,shared_store_throughput,gld_throughput,gst_throughput \
  ./hw4 /home/pp25/share/hw4/testcases/t25 t25.out
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:1 \
  ./hw4 /home/pp25/share/hw4/testcases/t25 t25.out
# hw4-amd on the amd partition, one GPU per job.
# t25 under rocprof --stats:
srun --partition=amd --nodes=1 --ntasks=1 --gres=gpu:1 \
  rocprof --stats ./hw4-amd /home/pp25/share/hw4/testcases/t25 t25.out
# Unprofiled runs on t25, t30 and t15; each writes <testcase>.out.
srun --partition=amd --nodes=1 --ntasks=1 --gres=gpu:1 ./hw4-amd /home/pp25/share/hw4/testcases/t25 t25.out
srun --partition=amd --nodes=1 --ntasks=1 --gres=gpu:1 ./hw4-amd /home/pp25/share/hw4/testcases/t30 t30.out
srun --partition=amd --nodes=1 --ntasks=1 --gres=gpu:1 ./hw4-amd /home/pp25/share/hw4/testcases/t15 t15.out
# hw4 on testcase t25 under nvprof with no extra profiler options.
srun --partition=nvidia --nodes=1 --ntasks=1 --gres=gpu:1 \
  nvprof ./hw4 /home/pp25/share/hw4/testcases/t25 t25.out
# rocprof --timestamp on --hip-trace --hsa-trace ./a.out input.bin output.bin