-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathprofile.sh
executable file
·91 lines (84 loc) · 2.25 KB
/
profile.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
#!/usr/bin/env bash
#
# profile.sh - benchmark every kernel of the runner binary over a sweep of
# square matrix sizes while the GPU core and memory clocks are locked.
#
# For each size the script prints a "Matrix size NxN" header, then for each
# kernel id prints a label and invokes:
#
#     $RUNNER <kernel-id> 50 <size> <size> <size>
#
# The literal 50 is forwarded unchanged as the runner's second argument
# (presumably a repeat/iteration count - confirm against the runner's usage).
# The size is passed three times (presumably the M, N and K GEMM dimensions -
# confirm against the runner).
#
# Environment:
#   RUNNER  benchmark executable to invoke (default: ./build/runner)
#
# A failing runner invocation does not stop the sweep; the remaining
# kernels and sizes are still executed.

RUNNER=${RUNNER:-./build/runner}

# Undo both clock locks. Installed as an EXIT trap below so the GPU is not
# left with locked clocks when the sweep is interrupted or ends early.
reset_gpu_clocks() {
  nvidia-smi --reset-gpu-clocks
  nvidia-smi --reset-memory-clocks
}

# Print the human-readable label for kernel id $1. Id 99 is labelled as the
# cuBLAS HGEMM reference; every other id is labelled "Kernel <id>".
kernel_label() {
  case "$1" in
    99) echo "cuBLAS HGEMM" ;;
    *) echo "Kernel $1" ;;
  esac
}

# Run kernels 1-6 and 99 for every matrix size, printing a header per size,
# a label per kernel and a separator line after each size.
run_benchmarks() {
  local size kernel
  for size in 1024 2048 4096 8192 16384; do
    echo "Matrix size ${size}x${size}"
    for kernel in 1 2 3 4 5 6 99; do
      kernel_label "$kernel"
      "$RUNNER" "$kernel" 50 "$size" "$size" "$size"
    done
    echo "------------------------------"
  done
}

# Register cleanup before locking so there is no window in which the clocks
# are locked but would not be reset. INT/TERM are routed through `exit` so
# the EXIT trap also fires on Ctrl-C / kill in shells that would otherwise
# skip it for untrapped signals.
trap reset_gpu_clocks EXIT
trap 'exit 130' INT
trap 'exit 143' TERM

# Locking is best-effort: warn and carry on so results are still produced,
# but make it visible that the timings were taken with unlocked clocks.
nvidia-smi --lock-gpu-clocks=1590 ||
  echo "warning: failed to lock GPU clocks; timings may be noisy" >&2
nvidia-smi --lock-memory-clocks=5000 ||
  echo "warning: failed to lock memory clocks; timings may be noisy" >&2

run_benchmarks