| 8 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
8192 |
((8, 8, 128)) |
2.46E-05 |
4 |
f32[8,8,128] |
f32[8,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.008563025 |
0.008734933799999999 |
0.0087918364 |
0.00883735848 |
0.008537815 |
0.008848739 |
5 |
0.008272509 |
2.8700138093722725 |
2.947142047540046 |
2.9589728528886137 |
2.9684374971674674 |
2.8798846636937085 |
2.970803658237181 |
5 |
2.777344884960445 |
|
| 16 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
16384 |
((16, 8, 128)) |
4.92E-05 |
4 |
f32[16,8,128] |
f32[16,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.0087491 |
0.0088256904 |
0.0088348142 |
0.008842113240000001 |
0.00874958 |
0.008843938 |
5 |
0.008639856 |
5.617949274782551 |
5.668926070677588 |
5.678954887980783 |
5.686977941823339 |
5.6179998946065774 |
5.688983705283978 |
5 |
5.55770517613308 |
|
| 32 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
32768 |
((32, 8, 128)) |
9.83E-05 |
4 |
f32[32,8,128] |
f32[32,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.009254502 |
0.009404802 |
0.009412485 |
0.0094186314 |
0.009276590599999999 |
0.009420168 |
5 |
0.009130852 |
10.62228956242054 |
10.7357777581096 |
10.750957184181201 |
10.763100725038482 |
10.59847213318989 |
10.766136610252802 |
5 |
10.4354826792898 |
|
| 64 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
65536 |
((64, 8, 128)) |
0.00019660800000000003 |
4 |
f32[64,8,128] |
f32[64,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.010660264 |
0.0107322934 |
0.0107442982 |
0.01075390204 |
0.010629532 |
0.010756303 |
5 |
0.010483794 |
18.443070453039443 |
18.705720804781432 |
18.72961847298997 |
18.7487366075568 |
18.497997026276316 |
18.753516141198507 |
5 |
18.27839918604004 |
| 128 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
131072 |
((128, 8, 128)) |
0.00039321600000000005 |
4 |
f32[128,8,128] |
f32[128,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.013602641 |
0.0136981992 |
0.0137164466 |
0.013731044520000001 |
0.013605522200000001 |
0.013734694 |
5 |
0.013506603 |
28.90732762850979 |
29.0839631046883 |
29.098417393391674 |
29.109980824354377 |
28.9022087992601 |
29.11287168209505 |
5 |
28.6293964758152 |
|
| 256 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
262144 |
((256, 8, 128)) |
0.0007864320000000001 |
4 |
f32[256,8,128] |
f32[256,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.018792317 |
0.018972629 |
0.019007923 |
0.0190361582 |
0.018821848800000002 |
0.019043217 |
5 |
0.018619448 |
41.848591634549386 |
42.085991701888126 |
42.16155962361874 |
42.22201396100324 |
41.785145728040824 |
42.23712754534937 |
5 |
41.2972240982183 |
|
| 512 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
524288 |
((512, 8, 128)) |
0.0015728640000000002 |
4 |
f32[512,8,128] |
f32[512,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.03054982 |
0.030619688 |
0.030627370999999997 |
0.030633517399999997 |
0.0305560626 |
0.030635054 |
5 |
0.030462185 |
51.485213333499196 |
51.58298787134468 |
51.60815810470684 |
51.628294291396564 |
51.47488373996223 |
51.633328338069 |
5 |
51.34196923563446 |
|
| 1024 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
1048576 |
((1024, 8, 128)) |
0.0031457280000000004 |
4 |
f32[1024,8,128] |
f32[1024,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.052659064 |
0.05272509 |
0.052732293 |
0.0527380554 |
0.052642017 |
0.052739496 |
5 |
0.052541417 |
59.737636050652185 |
59.85991101808027 |
59.86565366503011 |
59.870247782589985 |
59.757107524934476 |
59.87139631197995 |
5 |
59.64653132066337 |
|
| 2048 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
2097152 |
((2048, 8, 128)) |
0.006291456000000001 |
4 |
f32[2048,8,128] |
f32[2048,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.097747899 |
0.0979452578 |
0.0979918364 |
0.09802909928 |
0.0977875148 |
0.098038415 |
5 |
0.097648259 |
64.36410464433615 |
64.41679769761421 |
64.4232896437367 |
64.42848320063467 |
64.33815347050663 |
64.42978158985918 |
5 |
64.17337530395612 |
|
| 4096 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
4194304 |
((4096, 8, 128)) |
0.012582912000000002 |
4 |
f32[4096,8,128] |
f32[4096,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.188061224 |
0.188235054 |
0.188262185 |
0.18828388980000002 |
0.1880792316 |
0.188289316 |
5 |
0.187936375 |
66.90859355461816 |
66.95030520692961 |
66.95167358031136 |
66.95276827901677 |
66.90221981343015 |
66.95304195369312 |
5 |
66.8275410804509 |
|
|
| 8192 |
A2A |
non-parallel |
8 |
4x8 |
2 |
1x8 |
8388608 |
((8192, 8, 128)) |
0.025165824000000003 |
4 |
f32[8192,8,128] |
f32[8192,8,128]{2,1,0:T(8,128) |
{{0,1,2,3,4,5,6,7},{8,9,10,11,12,13,14,15},{16,17,18,19,20,21,22,23},{24,25,26,27,28,29,30,31}} |
0.368863145 |
0.3691212486 |
0.36916206479999997 |
0.36919471775999996 |
0.3688938776 |
0.369202881 |
5 |
0.368669868 |
68.22536851709596 |
68.25633569983937 |
68.25873585175053 |
68.26065597327946 |
68.21970299159307 |
68.26113600366169 |
5 |
68.16258836290068 |
Results summary
all_to_all_1d
all_to_all_2d
all_to_all_3d