-
Notifications
You must be signed in to change notification settings - Fork 21
/
timing_data.tsv
We can make this file beautiful and searchable if this error is corrected: It looks like row 4 should actually have 1 column, instead of 5 in line 3.
249 lines (234 loc) · 11.8 KB
/
timing_data.tsv
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
Ubuntu 18.04.1 LTS
g++ 9.2.1 with -O3
Intel Core i9-9900 @ 3.1GHz, single threaded
Operation result_nvals opt3.0_runtime_usec seq3.0_runtime_usec seq2.0.2_runtime_usec
IMPLEMENTATION: A*B
C := A+.*B 413601 14228 18319 6.79627e+06
C := C + A+.*B 413601 17151 20188 6.89181e+06
C<M,merge> := A+.*B 413601 9617 20098 6.58332e+06
C<M,replace> := A+.*B 44830 6027 17362 6.71729e+06
C<M,merge> := C + A+.*B 44830 7652 19649 6.53923e+06
C<M,replace> := C + A+.*B 44830 8785 19887 6.67295e+06
C<!M,merge> := A+.*B 413601 16682 343076 7.71499e+06
C<!M,replace> := A+.*B 368771 16592 308104 7.69739e+06
C<!M,merge> := C + A+.*B 368771 17573 373355 7.80115e+06
C<!M,replace> := C + A+.*B 368771 18506 315928 8.28012e+06
C<s(M),merge> := A+.*B 413601 8862 22071
C<s(M),replace> := A+.*B 44830 5770 19092
C<s(M),merge> := C + A+.*B 44830 11616 22608
C<s(M),replace> := C + A+.*B 44830 7524 19116
C<!s(M),merge> := A+.*B 413601 15862 331938
C<!s(M),replace> := A+.*B 368771 18016 289155
C<!s(M),merge> := C + A+.*B 368771 21548 357168
C<!s(M),replace> := C + A+.*B 368771 17337 290589
IMPLEMENTATION: A'*B
C := A'+.*B 413601 24575 19228 1.05907e+10
C := C + A'+.*B 413601 23914 20756 1.04975e+10
C<M,merge> := A'+.*B 413601 10061 21204 1.03085e+10
C<M,replace> := A'+.*B 44830 6930 18792
C<M,merge> := C + A'+.*B 44830 12129 21802
C<M,replace> := C + A'+.*B 44830 9170 18136
C<!M,merge> := A'+.*B 413601 24873 351930
C<!M,replace> := A'+.*B 368771 23142 326782
C<!M,merge> := C + A'+.*B 368771 25084 400182
C<!M,replace> := C + A'+.*B 368771 25461 305521
C<s(M),merge> := A'+.*B 413601 11006 24582
C<s(M),replace> := A'+.*B 44830 12749 20212
C<s(M),merge> := C + A'+.*B 44830 8998 23582
C<s(M),replace> := C + A'+.*B 44830 8025 20100
C<!s(M),merge> := A'+.*B 413601 27676 327496
C<!s(M),replace> := A'+.*B 368771 22756 283444
C<!s(M),merge> := C + A'+.*B 368771 28101 354580
C<!s(M),replace> := C + A'+.*B 368771 23901 286720
IMPLEMENTATION: A*B'
C := A+.*B' 413601 1.91157e+06 1.92264e+06 5.18809e+06
C := C + A+.*B' 413601 2.00197e+06 1.89916e+06 5.86669e+06
C<M,merge> := A+.*B' 413601 102858 1.91731e+06 5.44134e+06
C<M,replace> := A+.*B' 44830 100953 1.91211e+06 4.89272e+06
C<M,merge> := C + A+.*B' 44830 108823 1.87085e+06 5.12763e+06
C<M,replace> := C + A+.*B' 44830 109496 1.89146e+06 4.94909e+06
C<!M,merge> := A+.*B' 413601 1.85566e+06 2.24264e+06 7.26532e+06
C<!M,replace> := A+.*B' 368771 1.82126e+06 2.19104e+06 7.77947e+06
C<!M,merge> := C + A+.*B' 368771 1.86196e+06 2.31851e+06 7.97069e+06
C<!M,replace> := C + A+.*B' 368771 1.87124e+06 2.23134e+06 7.55298e+06
C<s(M),merge> := A+.*B' 413601 102875 1.93001e+06
C<s(M),replace> := A+.*B' 44830 97274 1.91891e+06
C<s(M),merge> := C + A+.*B' 44830 103801 1.94145e+06
C<s(M),replace> := C + A+.*B' 44830 107283 1.93083e+06
C<!s(M),merge> := A+.*B' 413601 1.8506e+06 2.1814e+06
C<!s(M),replace> := A+.*B' 368771 1.88142e+06 2.19568e+06
C<!s(M),merge> := C + A+.*B' 368771 1.89935e+06 2.26707e+06
C<!s(M),replace> := C + A+.*B' 368771 1.8806e+06 2.20845e+06
IMPLEMENTATION: A'*B'
C := A'+.*B' 413601 14262 22368 1.18102e+10
C := C + A'+.*B' 413601 30759 26622 1.14332e+10
C<M,merge> := A'+.*B' 413601 29904 27211 1.04933e+10
C<M,replace> := A'+.*B' 44830 25097 23843 1.04987e+10
C<M,merge> := C + A'+.*B' 44830 23587 26141 1.09838e+10
C<M,replace> := C + A'+.*B' 44830 25392 23062 1.0811e+10
C<!M,merge> := A'+.*B' 413601 28242 355720 1.03199e+10
C<!M,replace> := A'+.*B' 368771 27294 308354 1.03032e+10
C<!M,merge> := C + A'+.*B' 368771 32252 379830 1.09707e+10
C<!M,replace> := C + A'+.*B' 368771 29390 317011 1.09911e+10
C<s(M),merge> := A'+.*B' 413601 26210 26248
C<s(M),replace> := A'+.*B' 44830 24262 23398
C<s(M),merge> := C + A'+.*B' 44830 23213 24272
C<s(M),replace> := C + A'+.*B' 44830 25317 24151
C<!s(M),merge> := A'+.*B' 413601 29118 328156
C<!s(M),replace> := A'+.*B' 368771 26089 290723
C<!s(M),merge> := C + A'+.*B' 368771 30463 363853
C<!s(M),replace> := C + A'+.*B' 368771 28793 288954
Operation result_nvals 3.0_runtime_usec seq2.0.2_runtime_usec checksum
IMPLEMENTATION: A*u
w := A+.*u 3289 3386 5489 5104
w := w + A+.*u 3289 3254 4952 10208
w<m,merge> := A+.*u 3289 3181 7659 9460
w<m,replace> := A+.*u 485 2912 5885 748
w<m,merge> := w + A+.*u 485 3233 6104 1496
w<m,replace> := w + A+.*u 485 3207 5383 2244
w<!m,merge> := A+.*u 3289 3175 5993 6600
w<!m,replace> := A+.*u 2804 3362 6944 4356
w<!m,merge> := w + A+.*u 2804 3908 5040 8712
w<!m,replace> := w + A+.*u 2804 3086 5042 13068
w<s(m),replace> := A+.*u 485 2992 748
w<s(m),merge> := w + A+.*u 485 3444 1496
w<s(m),replace> := w + A+.*u 485 2873 2244
w<!s(m),merge> := A+.*u 3289 3259 6600
w<!s(m),replace> := A+.*u 2804 3698 4356
w<!s(m),merge> := w + A+.*u 2804 3168 8712
w<!s(m),replace> := w + A+.*u 2804 3513 13068
IMPLEMENTATION: A'*u
w := A'+.*u 3289 1071 930946 5104
w := w + A'+.*u 3289 1020 942266 10208
w<m,merge> := A'+.*u 3289 1073 1.04539e+06 9460
w<m,replace> := A'+.*u 485 1058 1.0503e+06 748
w<m,merge> := w + A'+.*u 485 1055 1.13544e+06 1496
w<m,replace> := w + A'+.*u 485 1051 1.12552e+06 2244
w<!m,merge> := A'+.*u 3289 1161 1.02462e+06 6600
w<!m,replace> := A'+.*u 2804 1114 1.02251e+06 4356
w<!m,merge> := w + A'+.*u 2804 1147 1.11604e+06 8712
w<!m,replace> := w + A'+.*u 2804 1147 1.11864e+06 13068
w<s(m),merge> := A'+.*u 3289 1255 13816
w<s(m),replace> := A'+.*u 485 1126 748
w<s(m),merge> := w + A'+.*u 485 1091 1496
w<s(m),replace> := w + A'+.*u 485 1125 2244
w<!s(m),merge> := A'+.*u 3289 1134 6600
w<!s(m),replace> := A'+.*u 2804 1141 4356
w<!s(m),merge> := w + A'+.*u 2804 1218 8712
w<!s(m),replace> := w + A'+.*u 2804 1200 13068
Results PASSED
IMPLEMENTATION: u'*A
w' := u'+.*A 3289 1395 1.09945e+06 5104
w' := w' + u'+.*A 3289 1343 948561 10208
w'<m',merge> := u'+.*A 3289 1387 1.08011e+06 9460
w'<m',replace> := u'+.*A 485 1438 1.06922e+06 748
w'<m',merge> := w' + u'+.*A 485 1365 1.01722e+06 1496
w'<m',replace> := w' + u'+.*A 485 1933 1.02241e+06 2244
w'<!m',merge> := u'+.*A 3289 1875 1.05708e+06 6600
w'<!m',replace> := u'+.*A 2804 1609 1.05496e+06 4356
w'<!m',merge> := w' + u'+.*A 2804 1548 1.02734e+06 8712
w'<!m',replace> := w' + u'+.*A 2804 1651 1.0334e+06 13068
w'<s(m'),merge> := u'+.*A 3289 1417 13816
w'<s(m'),replace> := u'+.*A 485 1397 748
w'<s(m'),merge> := w' + u'+.*A 485 1416 1496
w'<s(m'),replace> := w' + u'+.*A 485 1504 2244
w'<!s(m'),merge> := u'+.*A 3289 1950 6600
w'<!s(m'),replace> := u'+.*A 2804 1528 4356
w'<!s(m'),merge> := w' + u'+.*A 2804 1488 8712
w'<!s(m'),replace> := w' + u'+.*A 2804 1492 13068
IMPLEMENTATION: u'*A'
w' := u'+.*A' 3289 3177 3184 5104
w' := w' + u'+.*A' 3289 2998 3193 10208
w'<m',merge> := u'+.*A' 3289 2878 2886 9460
w'<m',replace> := u'+.*A' 485 2978 3084 748
w'<m',merge> := w' + u'+.*A' 485 2792 3458 1496
w'<m',replace> := w' + u'+.*A' 485 2884 2822 2244
w'<!m',merge> := u'+.*A' 3289 2947 2940 6600
w'<!m',replace> := u'+.*A' 2804 2900 3035 4356
w'<!m',merge> := w' + u'+.*A' 2804 3296 3398 8712
w'<!m',replace> := w' + u'+.*A' 2804 2953 3847 13068
w'<s(m'),merge> := u'+.*A' 3289 2971 13816
w'<s(m'),replace> := u'+.*A' 485 3068 748
w'<s(m'),merge> := w' + u'+.*A' 485 3264 1496
w'<s(m'),replace> := w' + u'+.*A' 485 2964 2244
w'<!s(m'),merge> := u'+.*A' 3289 3177 6600
w'<!s(m'),replace> := u'+.*A' 2804 3205 4356
w'<!s(m'),merge> := w' + u'+.*A' 2804 3010 8712
w'<!s(m'),replace> := w' + u'+.*A' 2804 3266 13068
Operation result_nvals 3.0_runtime_usec seq2.0.2_runtime_usec checksum
IMPLEMENTATION: A.*B
C := A.*B 37656 1861 2856 37656
C := C + A.*B 37656 1733 2287 75312
C<M,merge> := A.*B 37656 34972 38833 69759
C<M,replace> := A.*B 5553 27232 28687 5553
C<M,merge> := C + A.*B 5553 30760 38819 11106
C<M,replace> := C + A.*B 5553 26807 29299 16659
C<!M,merge> := A.*B 37656 344391 483427 48762
C<!M,replace> := A.*B 32103 312328 435168 32103
C<!M,merge> := C + A.*B 32103 367121 491110 64206
C<!M,replace> := C + A.*B 32103 309113 436658 96309
C<s(M),merge> := A.*B 37656 57994 101862
C<s(M),replace> := A.*B 5553 44261 5553
C<s(M),merge> := C + A.*B 5553 48590 11106
C<s(M),replace> := C + A.*B 5553 61481 16659
C<!s(M),merge> := A.*B 37656 345549 48762
C<!s(M),replace> := A.*B 32103 287347 32103
C<!s(M),merge> := C + A.*B 32103 350560 64206
C<!s(M),replace> := C + A.*B 32103 286933 96309
IMPLEMENTATION: A'.*B
C := A'.*B 37678 4895 978188 37678
C := C + A'.*B 37678 4533 972740 75356
C<M,merge> := A'.*B 37678 40180 1.0293e+06 69871
C<M,replace> := A'.*B 5485 31267 1.01838e+06 5485
C<M,merge> := C + A'.*B 5485 35506 997943 10970
C<M,replace> := C + A'.*B 5485 30744 1.00033e+06 16455
C<!M,merge> := A'.*B 37678 344986 1.4846e+06 48648
C<!M,replace> := A'.*B 32193 313091 1.45002e+06 32193
C<!M,merge> := C + A'.*B 32193 370772 1.47911e+06 64386
C<!M,replace> := C + A'.*B 32193 312804 1.43596e+06 96579
C<s(M),merge> := A'.*B 37678 59272 102064
C<s(M),replace> := A'.*B 5485 48640 5485
C<s(M),merge> := C + A'.*B 5485 51755 10970
C<s(M),replace> := C + A'.*B 5485 46890 16455
C<!s(M),merge> := A'.*B 37678 327240 48648
C<!s(M),replace> := A'.*B 32193 292907 32193
C<!s(M),merge> := C + A'.*B 32193 348970 64386
C<!s(M),replace> := C + A'.*B 32193 289895 96579
IMPLEMENTATION: A.*B'
C := A.*B' 37678 4838 1.00625e+06 37678
C := C + A.*B' 37678 4629 1.03707e+06 75356
C<M,merge> := A.*B' 37678 39471 1.09814e+06 69770
C<M,replace> := A.*B' 5586 32006 1.07943e+06 5586
C<M,merge> := C + A.*B' 5586 34434 1.02308e+06 11172
C<M,replace> := C + A.*B' 5586 31390 1.02341e+06 16758
C<!M,merge> := A.*B' 37678 347821 1.4815e+06 48850
C<!M,replace> := A.*B' 32092 313375 1.43834e+06 32092
C<!M,merge> := C + A.*B' 32092 372205 1.49655e+06 64184
C<!M,replace> := C + A.*B' 32092 312803 1.45583e+06 96276
C<s(M),merge> := A.*B' 37678 60061 101862
C<s(M),replace> := A.*B' 5586 49840 5586
C<s(M),merge> := C + A.*B' 5586 51848 11172
C<s(M),replace> := C + A.*B' 5586 47276 16758
C<!s(M),merge> := A.*B' 37678 324700 48850
C<!s(M),replace> := A.*B' 32092 290714 32092
C<!s(M),merge> := C + A.*B' 32092 350357 64184
C<!s(M),replace> := C + A.*B' 32092 291534 96276
IMPLEMENTATION: A'.*B'
C := A'.*B' 37656 2361 1.90801e+06 37656
C := C + A'.*B' 37656 2124 1.90345e+06 75312
C<M,merge> := A'.*B' 37656 35225 1.90978e+06 69754
C<M,replace> := A'.*B' 5558 27634 1.88757e+06 5558
C<M,merge> := C + A'.*B' 5558 31396 1.91595e+06 11116
C<M,replace> := C + A'.*B' 5558 27161 1.91335e+06 16674
C<!M,merge> := A'.*B' 37656 342344 2.34857e+06 48772
C<!M,replace> := A'.*B' 32098 310123 2.30649e+06 32098
C<!M,merge> := C + A'.*B' 32098 369931 2.33798e+06 64196
C<!M,replace> := C + A'.*B' 32098 310697 2.29018e+06 96294
C<s(M),merge> := A'.*B' 37656 53507 101852
C<s(M),replace> := A'.*B' 5558 45691 5558
C<s(M),merge> := C + A'.*B' 5558 49552 11116
C<s(M),replace> := C + A'.*B' 5558 44821 16674
C<!s(M),merge> := A'.*B' 37656 322097 48772
C<!s(M),replace> := A'.*B' 32098 287250 32098
C<!s(M),merge> := C + A'.*B' 32098 349375 64196
C<!s(M),replace> := C + A'.*B' 32098 289946 96294