-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathall-cpu-gpu-mm-timings.txt
50 lines (50 loc) · 2.58 KB
/
all-cpu-gpu-mm-timings.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
n m ||| CPUForLoops CPUEigenMv CPUEigenMM cublasMM
256 256 ||| 0.0324803 0.00196201 0.000875768 8.8513e-05
256 512 ||| 0.0505194 0.00340229 0.00121345 0.000104882
256 1024 ||| 0.0766311 0.00522265 0.00157235 0.000169133
256 2048 ||| 0.137887 0.00781341 0.00207219 0.000293894
256 4096 ||| 0.275083 0.0152978 0.00408318 0.000533788
256 8192 ||| 0.581185 0.0308976 0.0083212 0.00101935
256 16384 ||| 1.25832 0.0687339 0.0172546 0.00198313
512 256 ||| 0.0342268 0.00183152 0.000629319 9.789e-05
512 512 ||| 0.0690569 0.00360493 0.00101234 0.000140424
512 1024 ||| 0.140117 0.00715944 0.00191271 0.000234157
512 2048 ||| 0.283161 0.0143068 0.00370366 0.000420704
512 4096 ||| 1.03346 0.0292042 0.00792468 0.000782422
512 8192 ||| 2.72327 0.0818505 0.0168892 0.00151836
512 16384 ||| 9.7187 0.343331 0.0331934 0.00307129
1024 256 ||| 0.0713907 0.00367979 0.00104544 0.000167425
1024 512 ||| 0.1458 0.00728184 0.00199655 0.000218154
1024 1024 ||| 0.294579 0.0144848 0.00386971 0.00037861
1024 2048 ||| 2.11281 0.0291591 0.00813351 0.00080798
1024 4096 ||| 4.13805 0.0766496 0.0169549 0.00142428
1024 8192 ||| 9.40453 0.251935 0.0322193 0.00262466
1024 16384 ||| 24.3075 0.514823 0.0645524 0.00465125
2048 256 ||| 0.142645 0.00822824 0.00201344 0.000229572
2048 512 ||| 0.290412 0.0163487 0.00429587 0.000377616
2048 1024 ||| 2.08744 0.0329292 0.00827569 0.000639239
2048 2048 ||| 4.23547 0.103746 0.0186084 0.0011467
2048 4096 ||| 9.8823 0.282378 0.0323487 0.00218326
2048 8192 ||| 27.0018 0.57826 0.0642626 0.00386335
2048 16384 ||| 54.2227 1.15597 0.128188 0.00798399
4096 256 ||| 0.297484 0.0166134 0.00492434 0.000378427
4096 512 ||| 2.08781 0.0334282 0.0102024 0.000575507
4096 1024 ||| 3.77705 0.0796326 0.0191328 0.000942531
4096 2048 ||| 10.9048 0.287159 0.0329666 0.00195221
4096 4096 ||| 27.2921 0.574098 0.0643499 0.00337177
4096 8192 ||| 49.522 1.43633 0.13274 0.00675155
4096 16384 ||| 97.2304 3.14265 0.267085 0.012899
8192 256 ||| 2.12882 0.0322599 0.0125839 0.00061284
8192 512 ||| 3.80707 0.0814274 0.0279265 0.000956158
8192 1024 ||| 10.7353 0.279874 0.0376528 0.00166894
8192 2048 ||| 31.2598 0.582645 0.0777618 0.0029932
8192 4096 ||| 54.2438 1.24568 0.138018 0.00586591
8192 8192 ||| 112.888 3.06222 0.290453 0.0114775
8192 16384 ||| 231.065 4.62829 0.556746 0.022804
16384 256 ||| 1.099 0.068789 0.0216357 0.000870151
16384 512 ||| 15.8341 0.347667 0.0465036 0.00149914
16384 1024 ||| 35.2164 0.682984 0.0846369 0.00275091
16384 2048 ||| 67.0375 2.11604 0.159178 0.00526287
16384 4096 ||| 146.657 2.75023 0.308909 0.0103676
16384 8192 ||| 272.837 9.44329 0.622271 0.020922
16384 16384 ||| 550.109 10.9461 1.19432 0.0405363