From 3973ca1a0630ed5668b90d8e9a5e8934636ed5ec Mon Sep 17 00:00:00 2001 From: Adrian Kummerlaender Date: Thu, 4 Jul 2019 00:02:32 +0200 Subject: Update benchmark results of LDC @ Tesla P100 --- result/ldc_2d_benchmark_P100.log | 470 ++++++++++++++++++++++++++------------- result/ldc_2d_benchmark_P100.py | 2 +- result/ldc_3d_benchmark_P100.log | 444 ++++++++++++++++++++++++------------ result/ldc_3d_benchmark_P100.py | 2 +- 4 files changed, 616 insertions(+), 302 deletions(-) (limited to 'result') diff --git a/result/ldc_2d_benchmark_P100.log b/result/ldc_2d_benchmark_P100.log index 3bacbe6..a8cc599 100644 --- a/result/ldc_2d_benchmark_P100.log +++ b/result/ldc_2d_benchmark_P100.log @@ -1,156 +1,314 @@ -(32, (16, 1), 'single', True): ~14 MLUPS -(32, (16, 1), 'single', False): ~15 MLUPS -(32, (16, 1), 'double', True): ~15 MLUPS -(32, (16, 1), 'double', False): ~15 MLUPS -(32, (32, 1), 'single', True): ~14 MLUPS -(32, (32, 1), 'single', False): ~15 MLUPS -(32, (32, 1), 'double', True): ~15 MLUPS -(32, (32, 1), 'double', False): ~15 MLUPS -(64, (16, 1), 'single', True): ~58 MLUPS -(64, (16, 1), 'single', False): ~59 MLUPS -(64, (16, 1), 'double', True): ~59 MLUPS -(64, (16, 1), 'double', False): ~56 MLUPS -(64, (32, 1), 'single', True): ~60 MLUPS -(64, (32, 1), 'single', False): ~59 MLUPS -(64, (32, 1), 'double', True): ~59 MLUPS -(64, (32, 1), 'double', False): ~59 MLUPS -(64, (64, 1), 'single', True): ~60 MLUPS -(64, (64, 1), 'single', False): ~58 MLUPS -(64, (64, 1), 'double', True): ~59 MLUPS -(64, (64, 1), 'double', False): ~59 MLUPS -(96, (16, 1), 'single', True): ~133 MLUPS -(96, (16, 1), 'single', False): ~132 MLUPS -(96, (16, 1), 'double', True): ~133 MLUPS -(96, (16, 1), 'double', False): ~126 MLUPS -(96, (24, 1), 'single', True): ~129 MLUPS -(96, (24, 1), 'single', False): ~133 MLUPS -(96, (24, 1), 'double', True): ~134 MLUPS -(96, (24, 1), 'double', False): ~133 MLUPS -(96, (32, 1), 'single', True): ~134 MLUPS -(96, (32, 1), 'single', False): ~133 MLUPS -(96, (32, 1), 'double', True): ~134 MLUPS -(96, (32, 1), 'double', False): ~134 MLUPS -(96, (48, 1), 'single', True): ~133 MLUPS -(96, (48, 1), 'single', False): ~135 MLUPS -(96, (48, 1), 'double', True): ~135 MLUPS -(96, (48, 1), 'double', False): ~133 MLUPS -(96, (96, 1), 'single', True): ~136 MLUPS -(96, (96, 1), 'single', False): ~135 MLUPS -(96, (96, 1), 'double', True): ~136 MLUPS -(96, (96, 1), 'double', False): ~136 MLUPS -(128, (16, 1), 'single', True): ~240 MLUPS -(128, (16, 1), 'single', False): ~220 MLUPS -(128, (16, 1), 'double', True): ~222 MLUPS -(128, (16, 1), 'double', False): ~204 MLUPS -(128, (32, 1), 'single', True): ~218 MLUPS -(128, (32, 1), 'single', False): ~237 MLUPS -(128, (32, 1), 'double', True): ~240 MLUPS -(128, (32, 1), 'double', False): ~242 MLUPS -(128, (64, 1), 'single', True): ~241 MLUPS -(128, (64, 1), 'single', False): ~240 MLUPS -(128, (64, 1), 'double', True): ~241 MLUPS -(128, (64, 1), 'double', False): ~237 MLUPS -(128, (128, 1), 'single', True): ~239 MLUPS -(128, (128, 1), 'single', False): ~238 MLUPS -(128, (128, 1), 'double', True): ~238 MLUPS -(128, (128, 1), 'double', False): ~238 MLUPS -(256, (16, 1), 'single', True): ~953 MLUPS -(256, (16, 1), 'single', False): ~932 MLUPS -(256, (16, 1), 'double', True): ~957 MLUPS -(256, (16, 1), 'double', False): ~906 MLUPS -(256, (32, 1), 'single', True): ~972 MLUPS -(256, (32, 1), 'single', False): ~963 MLUPS -(256, (32, 1), 'double', True): ~965 MLUPS -(256, (32, 1), 'double', False): ~959 MLUPS -(256, (64, 1), 'single', True): ~960 MLUPS -(256, (64, 1), 'single', False): ~968 MLUPS -(256, (64, 1), 'double', True): ~967 MLUPS -(256, (64, 1), 'double', False): ~960 MLUPS -(256, (128, 1), 'single', True): ~955 MLUPS -(256, (128, 1), 'single', False): ~919 MLUPS -(256, (128, 1), 'double', True): ~960 MLUPS -(256, (128, 1), 'double', False): ~961 MLUPS -(256, (256, 1), 'single', True): ~965 MLUPS -(256, (256, 1), 'single', False): ~966 MLUPS -(256, (256, 1), 'double', True): ~970 MLUPS -(256, (256, 1), 'double', False): ~957 MLUPS -(512, (16, 1), 'single', True): ~3806 MLUPS -(512, (16, 1), 'single', False): ~2918 MLUPS -(512, (16, 1), 'double', True): ~3272 MLUPS -(512, (16, 1), 'double', False): ~1233 MLUPS -(512, (32, 1), 'single', True): ~3786 MLUPS -(512, (32, 1), 'single', False): ~3681 MLUPS -(512, (32, 1), 'double', True): ~3284 MLUPS -(512, (32, 1), 'double', False): ~2300 MLUPS -(512, (64, 1), 'single', True): ~3799 MLUPS -(512, (64, 1), 'single', False): ~3806 MLUPS -(512, (64, 1), 'double', True): ~3299 MLUPS -(512, (64, 1), 'double', False): ~2287 MLUPS -(512, (128, 1), 'single', True): ~3769 MLUPS -(512, (128, 1), 'single', False): ~3408 MLUPS -(512, (128, 1), 'double', True): ~3295 MLUPS -(512, (128, 1), 'double', False): ~2280 MLUPS -(512, (256, 1), 'single', True): ~3764 MLUPS -(512, (256, 1), 'single', False): ~3889 MLUPS -(512, (256, 1), 'double', True): ~3288 MLUPS -(512, (256, 1), 'double', False): ~2293 MLUPS -(512, (512, 1), 'single', True): ~3830 MLUPS -(512, (512, 1), 'single', False): ~3812 MLUPS -(512, (512, 1), 'double', True): ~3290 MLUPS -(512, (512, 1), 'double', False): ~2123 MLUPS -(1024, (16, 1), 'single', True): ~6332 MLUPS -(1024, (16, 1), 'single', False): ~3809 MLUPS -(1024, (16, 1), 'double', True): ~3473 MLUPS -(1024, (16, 1), 'double', False): ~1291 MLUPS -(1024, (32, 1), 'single', True): ~6641 MLUPS -(1024, (32, 1), 'single', False): ~6496 MLUPS -(1024, (32, 1), 'double', True): ~3470 MLUPS -(1024, (32, 1), 'double', False): ~2525 MLUPS -(1024, (64, 1), 'single', True): ~6588 MLUPS -(1024, (64, 1), 'single', False): ~6436 MLUPS -(1024, (64, 1), 'double', True): ~3450 MLUPS -(1024, (64, 1), 'double', False): ~2521 MLUPS -(1024, (128, 1), 'single', True): ~6605 MLUPS -(1024, (128, 1), 'single', False): ~6427 MLUPS -(1024, (128, 1), 'double', True): ~3449 MLUPS -(1024, (128, 1), 'double', False): ~2524 MLUPS -(1024, (256, 1), 'single', True): ~6602 MLUPS -(1024, (256, 1), 'single', False): ~6355 MLUPS -(1024, (256, 1), 'double', True): ~3456 MLUPS -(1024, (256, 1), 'double', False): ~2573 MLUPS -(1024, (512, 1), 'single', True): ~6594 MLUPS -(1024, (512, 1), 'single', False): ~6143 MLUPS -(1024, (512, 1), 'double', True): ~3464 MLUPS -(1024, (512, 1), 'double', False): ~2428 MLUPS -(1024, (1024, 1), 'single', True): ~6547 MLUPS -(1024, (1024, 1), 'single', False): ~5615 MLUPS -(1024, (1024, 1), 'double', True): ~3420 MLUPS -(1024, (1024, 1), 'double', False): ~2256 MLUPS -(2048, (16, 1), 'single', True): ~6513 MLUPS -(2048, (16, 1), 'double', True): ~3555 MLUPS -(2048, (32, 1), 'single', True): ~6723 MLUPS -(2048, (32, 1), 'double', True): ~3572 MLUPS -(2048, (64, 1), 'single', True): ~6766 MLUPS -(2048, (64, 1), 'double', True): ~3556 MLUPS -(2048, (128, 1), 'single', True): ~6790 MLUPS -(2048, (128, 1), 'double', True): ~3553 MLUPS -(2048, (256, 1), 'single', True): ~6794 MLUPS -(2048, (256, 1), 'double', True): ~3560 MLUPS -(2048, (512, 1), 'single', True): ~6802 MLUPS -(2048, (512, 1), 'double', True): ~3563 MLUPS -(2048, (1024, 1), 'single', True): ~6744 MLUPS -(2048, (1024, 1), 'double', True): ~3521 MLUPS -(4096, (16, 1), 'single', True): ~6636 MLUPS -(4096, (16, 1), 'double', True): ~3432 MLUPS -(4096, (32, 1), 'single', True): ~6910 MLUPS -(4096, (32, 1), 'double', True): ~3440 MLUPS -(4096, (64, 1), 'single', True): ~6852 MLUPS -(4096, (64, 1), 'double', True): ~3415 MLUPS -(4096, (128, 1), 'single', True): ~6875 MLUPS -(4096, (128, 1), 'double', True): ~3420 MLUPS -(4096, (256, 1), 'single', True): ~6882 MLUPS -(4096, (256, 1), 'double', True): ~3432 MLUPS -(4096, (512, 1), 'single', True): ~6890 MLUPS -(4096, (512, 1), 'double', True): ~3442 MLUPS -(4096, (1024, 1), 'single', True): ~6862 MLUPS -(4096, (1024, 1), 'double', True): ~3410 MLUPS +(32, (32, 1), 'single', False, True): ~13 MLUPS +(32, (32, 1), 'single', True, True): ~13 MLUPS +(32, (32, 1), 'double', False, True): ~13 MLUPS +(32, (32, 1), 'double', True, True): ~13 MLUPS +(32, (16, 1), 'single', False, True): ~13 MLUPS +(32, (16, 1), 'single', True, True): ~13 MLUPS +(32, (16, 1), 'double', False, True): ~13 MLUPS +(32, (16, 1), 'double', True, True): ~13 MLUPS +(256, (256, 1), 'single', False, True): ~852 MLUPS +(256, (256, 1), 'single', True, True): ~862 MLUPS +(256, (256, 1), 'double', False, True): ~847 MLUPS +(256, (256, 1), 'double', True, True): ~856 MLUPS +(256, (32, 1), 'single', False, True): ~862 MLUPS +(256, (32, 1), 'single', True, True): ~859 MLUPS +(256, (32, 1), 'double', False, True): ~851 MLUPS +(256, (32, 1), 'double', True, True): ~848 MLUPS +(256, (64, 1), 'single', False, True): ~813 MLUPS +(256, (64, 1), 'single', True, True): ~856 MLUPS +(256, (64, 1), 'double', False, True): ~849 MLUPS +(256, (64, 1), 'double', True, True): ~857 MLUPS +(256, (128, 1), 'single', False, True): ~952 MLUPS +(256, (128, 1), 'single', True, True): ~953 MLUPS +(256, (128, 1), 'double', False, True): ~938 MLUPS +(256, (128, 1), 'double', True, True): ~964 MLUPS +(256, (16, 1), 'single', False, True): ~950 MLUPS +(256, (16, 1), 'single', True, True): ~939 MLUPS +(256, (16, 1), 'double', False, True): ~935 MLUPS +(256, (16, 1), 'double', True, True): ~913 MLUPS +(64, (32, 1), 'single', False, True): ~56 MLUPS +(64, (32, 1), 'single', True, True): ~59 MLUPS +(64, (32, 1), 'double', False, True): ~58 MLUPS +(64, (32, 1), 'double', True, True): ~58 MLUPS +(64, (64, 1), 'single', False, True): ~58 MLUPS +(64, (64, 1), 'single', True, True): ~59 MLUPS +(64, (64, 1), 'double', False, True): ~57 MLUPS +(64, (64, 1), 'double', True, True): ~59 MLUPS +(64, (16, 1), 'single', False, True): ~59 MLUPS +(64, (16, 1), 'single', True, True): ~59 MLUPS +(64, (16, 1), 'double', False, True): ~59 MLUPS +(64, (16, 1), 'double', True, True): ~58 MLUPS +(128, (32, 1), 'single', False, True): ~213 MLUPS +(128, (32, 1), 'single', True, True): ~215 MLUPS +(128, (32, 1), 'double', False, True): ~213 MLUPS +(128, (32, 1), 'double', True, True): ~215 MLUPS +(128, (64, 1), 'single', False, True): ~215 MLUPS +(128, (64, 1), 'single', True, True): ~215 MLUPS +(128, (64, 1), 'double', False, True): ~215 MLUPS +(128, (64, 1), 'double', True, True): ~217 MLUPS +(128, (128, 1), 'single', False, True): ~216 MLUPS +(128, (128, 1), 'single', True, True): ~215 MLUPS +(128, (128, 1), 'double', False, True): ~213 MLUPS +(128, (128, 1), 'double', True, True): ~214 MLUPS +(128, (16, 1), 'single', False, True): ~214 MLUPS +(128, (16, 1), 'single', True, True): ~215 MLUPS +(128, (16, 1), 'double', False, True): ~213 MLUPS +(128, (16, 1), 'double', True, True): ~216 MLUPS +(512, (256, 1), 'single', False, True): ~3376 MLUPS +(512, (256, 1), 'single', True, True): ~3407 MLUPS +(512, (256, 1), 'double', False, True): ~2145 MLUPS +(512, (256, 1), 'double', True, True): ~3339 MLUPS +(512, (32, 1), 'single', False, True): ~3418 MLUPS +(512, (32, 1), 'single', True, True): ~3402 MLUPS +(512, (32, 1), 'double', False, True): ~2126 MLUPS +(512, (32, 1), 'double', True, True): ~3359 MLUPS +(512, (64, 1), 'single', False, True): ~3628 MLUPS +(512, (64, 1), 'single', True, True): ~3414 MLUPS +(512, (64, 1), 'double', False, True): ~2102 MLUPS +(512, (64, 1), 'double', True, True): ~3351 MLUPS +(512, (128, 1), 'single', False, True): ~3392 MLUPS +(512, (128, 1), 'single', True, True): ~3410 MLUPS +(512, (128, 1), 'double', False, True): ~1960 MLUPS +(512, (128, 1), 'double', True, True): ~3325 MLUPS +(512, (512, 1), 'single', False, True): ~3234 MLUPS +(512, (512, 1), 'single', True, True): ~3408 MLUPS +(512, (512, 1), 'double', False, True): ~2029 MLUPS +(512, (512, 1), 'double', True, True): ~3331 MLUPS +(512, (16, 1), 'single', False, True): ~3183 MLUPS +(512, (16, 1), 'single', True, True): ~3441 MLUPS +(512, (16, 1), 'double', False, True): ~1137 MLUPS +(512, (16, 1), 'double', True, True): ~3305 MLUPS +(1024, (256, 1), 'single', False, True): ~6302 MLUPS +(1024, (256, 1), 'single', True, True): ~6621 MLUPS +(1024, (256, 1), 'double', False, True): ~2637 MLUPS +(1024, (256, 1), 'double', True, True): ~3481 MLUPS +(1024, (32, 1), 'single', False, True): ~6603 MLUPS +(1024, (32, 1), 'single', True, True): ~6728 MLUPS +(1024, (32, 1), 'double', False, True): ~2608 MLUPS +(1024, (32, 1), 'double', True, True): ~3491 MLUPS +(1024, (64, 1), 'single', False, True): ~6552 MLUPS +(1024, (64, 1), 'single', True, True): ~6699 MLUPS +(1024, (64, 1), 'double', False, True): ~2604 MLUPS +(1024, (64, 1), 'double', True, True): ~3485 MLUPS +(1024, (128, 1), 'single', False, True): ~6478 MLUPS +(1024, (128, 1), 'single', True, True): ~6696 MLUPS +(1024, (128, 1), 'double', False, True): ~2606 MLUPS +(1024, (128, 1), 'double', True, True): ~3459 MLUPS +(1024, (512, 1), 'single', False, True): ~6184 MLUPS +(1024, (512, 1), 'single', True, True): ~6712 MLUPS +(1024, (512, 1), 'double', False, True): ~2573 MLUPS +(1024, (512, 1), 'double', True, True): ~3492 MLUPS +(1024, (1024, 1), 'single', False, True): ~5705 MLUPS +(1024, (1024, 1), 'single', True, True): ~6647 MLUPS +(1024, (1024, 1), 'double', False, True): ~2338 MLUPS +(1024, (1024, 1), 'double', True, True): ~3347 MLUPS +(1024, (16, 1), 'single', False, True): ~3873 MLUPS +(1024, (16, 1), 'single', True, True): ~6460 MLUPS +(1024, (16, 1), 'double', False, True): ~1333 MLUPS +(1024, (16, 1), 'double', True, True): ~3443 MLUPS +(2048, (256, 1), 'single', False, True): ~6762 MLUPS +(2048, (256, 1), 'single', True, True): ~6884 MLUPS +(2048, (256, 1), 'double', False, True): ~2814 MLUPS +(2048, (256, 1), 'double', True, True): ~3570 MLUPS +(2048, (32, 1), 'single', False, True): ~6957 MLUPS +(2048, (32, 1), 'single', True, True): ~6922 MLUPS +(2048, (32, 1), 'double', False, True): ~2714 MLUPS +(2048, (32, 1), 'double', True, True): ~3585 MLUPS +(2048, (64, 1), 'single', False, True): ~6865 MLUPS +(2048, (64, 1), 'single', True, True): ~6833 MLUPS +(2048, (64, 1), 'double', False, True): ~2644 MLUPS +(2048, (64, 1), 'double', True, True): ~3570 MLUPS +(2048, (128, 1), 'single', False, True): ~6809 MLUPS +(2048, (128, 1), 'single', True, True): ~6889 MLUPS +(2048, (128, 1), 'double', False, True): ~2719 MLUPS +(2048, (128, 1), 'double', True, True): ~3570 MLUPS +(2048, (512, 1), 'single', False, True): ~6585 MLUPS +(2048, (512, 1), 'single', True, True): ~6832 MLUPS +(2048, (512, 1), 'double', False, True): ~2732 MLUPS +(2048, (512, 1), 'double', True, True): ~3573 MLUPS +(2048, (1024, 1), 'single', False, True): ~6269 MLUPS +(2048, (1024, 1), 'single', True, True): ~6811 MLUPS +(2048, (1024, 1), 'double', False, True): ~2467 MLUPS +(2048, (1024, 1), 'double', True, True): ~3534 MLUPS +(2048, (16, 1), 'single', False, True): ~3905 MLUPS +(2048, (16, 1), 'single', True, True): ~6693 MLUPS +(2048, (16, 1), 'double', False, True): ~1367 MLUPS +(2048, (16, 1), 'double', True, True): ~3578 MLUPS +(800, (200, 1), 'single', True, False): ~6033 MLUPS +(800, (200, 1), 'single', True, True): ~6013 MLUPS +(800, (200, 1), 'double', True, False): ~3216 MLUPS +(800, (200, 1), 'double', True, True): ~3273 MLUPS +(800, (10, 1), 'single', True, False): ~4696 MLUPS +(800, (10, 1), 'single', True, True): ~4724 MLUPS +(800, (10, 1), 'double', True, False): ~3052 MLUPS +(800, (10, 1), 'double', True, True): ~3031 MLUPS +(800, (100, 1), 'single', True, False): ~5990 MLUPS +(800, (100, 1), 'single', True, True): ~5927 MLUPS +(800, (100, 1), 'double', True, False): ~3144 MLUPS +(800, (100, 1), 'double', True, True): ~3216 MLUPS +(800, (50, 1), 'single', True, False): ~5927 MLUPS +(800, (50, 1), 'single', True, True): ~5897 MLUPS +(800, (50, 1), 'double', True, False): ~3141 MLUPS +(800, (50, 1), 'double', True, True): ~3156 MLUPS +(100, (10, 1), 'single', True, False): ~144 MLUPS +(100, (10, 1), 'single', True, True): ~143 MLUPS +(100, (10, 1), 'double', True, False): ~142 MLUPS +(100, (10, 1), 'double', True, True): ~140 MLUPS +(100, (100, 1), 'single', True, False): ~143 MLUPS +(100, (100, 1), 'single', True, True): ~144 MLUPS +(100, (100, 1), 'double', True, False): ~140 MLUPS +(100, (100, 1), 'double', True, True): ~144 MLUPS +(100, (50, 1), 'single', True, False): ~141 MLUPS +(100, (50, 1), 'single', True, True): ~142 MLUPS +(100, (50, 1), 'double', True, False): ~147 MLUPS +(100, (50, 1), 'double', True, True): ~146 MLUPS +(200, (200, 1), 'single', True, False): ~576 MLUPS +(200, (200, 1), 'single', True, True): ~576 MLUPS +(200, (200, 1), 'double', True, False): ~573 MLUPS +(200, (200, 1), 'double', True, True): ~580 MLUPS +(200, (10, 1), 'single', True, False): ~582 MLUPS +(200, (10, 1), 'single', True, True): ~581 MLUPS +(200, (10, 1), 'double', True, False): ~580 MLUPS +(200, (10, 1), 'double', True, True): ~583 MLUPS +(200, (100, 1), 'single', True, False): ~584 MLUPS +(200, (100, 1), 'single', True, True): ~587 MLUPS +(200, (100, 1), 'double', True, False): ~580 MLUPS +(200, (100, 1), 'double', True, True): ~579 MLUPS +(200, (50, 1), 'single', True, False): ~583 MLUPS +(200, (50, 1), 'single', True, True): ~588 MLUPS +(200, (50, 1), 'double', True, False): ~578 MLUPS +(200, (50, 1), 'double', True, True): ~573 MLUPS +(1000, (200, 1), 'single', True, False): ~6442 MLUPS +(1000, (200, 1), 'single', True, True): ~6252 MLUPS +(1000, (200, 1), 'double', True, False): ~3312 MLUPS +(1000, (200, 1), 'double', True, True): ~3317 MLUPS +(1000, (10, 1), 'single', True, False): ~4990 MLUPS +(1000, (10, 1), 'single', True, True): ~4749 MLUPS +(1000, (10, 1), 'double', True, False): ~3130 MLUPS +(1000, (10, 1), 'double', True, True): ~3126 MLUPS +(1000, (100, 1), 'single', True, False): ~6348 MLUPS +(1000, (100, 1), 'single', True, True): ~6218 MLUPS +(1000, (100, 1), 'double', True, False): ~3327 MLUPS +(1000, (100, 1), 'double', True, True): ~3287 MLUPS +(1000, (50, 1), 'single', True, False): ~6318 MLUPS +(1000, (50, 1), 'single', True, True): ~6095 MLUPS +(1000, (50, 1), 'double', True, False): ~3242 MLUPS +(1000, (50, 1), 'double', True, True): ~3269 MLUPS +(400, (200, 1), 'single', True, False): ~2295 MLUPS +(400, (200, 1), 'single', True, True): ~2252 MLUPS +(400, (200, 1), 'double', True, False): ~2197 MLUPS +(400, (200, 1), 'double', True, True): ~2204 MLUPS +(400, (10, 1), 'single', True, False): ~2278 MLUPS +(400, (10, 1), 'single', True, True): ~2325 MLUPS +(400, (10, 1), 'double', True, False): ~2215 MLUPS +(400, (10, 1), 'double', True, True): ~2306 MLUPS +(400, (100, 1), 'single', True, False): ~2319 MLUPS +(400, (100, 1), 'single', True, True): ~2307 MLUPS +(400, (100, 1), 'double', True, False): ~2298 MLUPS +(400, (100, 1), 'double', True, True): ~2296 MLUPS +(400, (50, 1), 'single', True, False): ~2307 MLUPS +(400, (50, 1), 'single', True, True): ~2318 MLUPS +(400, (50, 1), 'double', True, False): ~2245 MLUPS +(400, (50, 1), 'double', True, True): ~2240 MLUPS +(50, (10, 1), 'single', True, False): ~35 MLUPS +(50, (10, 1), 'single', True, True): ~35 MLUPS +(50, (10, 1), 'double', True, False): ~35 MLUPS +(50, (10, 1), 'double', True, True): ~35 MLUPS +(50, (50, 1), 'single', True, False): ~35 MLUPS +(50, (50, 1), 'single', True, True): ~35 MLUPS +(50, (50, 1), 'double', True, False): ~33 MLUPS +(50, (50, 1), 'double', True, True): ~36 MLUPS +(600, (30, 1), 'single', True, False): ~5074 MLUPS +(600, (30, 1), 'single', True, True): ~5089 MLUPS +(600, (30, 1), 'double', True, False): ~3260 MLUPS +(600, (30, 1), 'double', True, True): ~3258 MLUPS +(600, (200, 1), 'single', True, False): ~5065 MLUPS +(600, (200, 1), 'single', True, True): ~5038 MLUPS +(600, (200, 1), 'double', True, False): ~3298 MLUPS +(600, (200, 1), 'double', True, True): ~3274 MLUPS +(600, (10, 1), 'single', True, False): ~4640 MLUPS +(600, (10, 1), 'single', True, True): ~4594 MLUPS +(600, (10, 1), 'double', True, False): ~3103 MLUPS +(600, (10, 1), 'double', True, True): ~3075 MLUPS +(600, (100, 1), 'single', True, False): ~5065 MLUPS +(600, (100, 1), 'single', True, True): ~5065 MLUPS +(600, (100, 1), 'double', True, False): ~3280 MLUPS +(600, (100, 1), 'double', True, True): ~3267 MLUPS +(600, (50, 1), 'single', True, False): ~5173 MLUPS +(600, (50, 1), 'single', True, True): ~5148 MLUPS +(600, (50, 1), 'double', True, False): ~3271 MLUPS +(600, (50, 1), 'double', True, True): ~3288 MLUPS +(800, (256, 1), 'single', True, True): ~6014 MLUPS +(800, (256, 1), 'double', True, True): ~3320 MLUPS +(800, (32, 1), 'single', True, True): ~6203 MLUPS +(800, (32, 1), 'double', True, True): ~3331 MLUPS +(800, (64, 1), 'single', True, True): ~6256 MLUPS +(800, (64, 1), 'double', True, True): ~3348 MLUPS +(800, (128, 1), 'single', True, True): ~6359 MLUPS +(800, (128, 1), 'double', True, True): ~3421 MLUPS +(800, (512, 1), 'single', True, True): ~6022 MLUPS +(800, (512, 1), 'double', True, True): ~3304 MLUPS +(800, (16, 1), 'single', True, True): ~5725 MLUPS +(800, (16, 1), 'double', True, True): ~3190 MLUPS +(100, (32, 1), 'single', True, True): ~147 MLUPS +(100, (32, 1), 'double', True, True): ~145 MLUPS +(100, (64, 1), 'single', True, True): ~145 MLUPS +(100, (64, 1), 'double', True, True): ~146 MLUPS +(100, (128, 1), 'single', True, True): ~145 MLUPS +(100, (128, 1), 'double', True, True): ~146 MLUPS +(100, (16, 1), 'single', True, True): ~148 MLUPS +(100, (16, 1), 'double', True, True): ~146 MLUPS +(200, (256, 1), 'single', True, True): ~583 MLUPS +(200, (256, 1), 'double', True, True): ~573 MLUPS +(200, (32, 1), 'single', True, True): ~580 MLUPS +(200, (32, 1), 'double', True, True): ~577 MLUPS +(200, (64, 1), 'single', True, True): ~579 MLUPS +(200, (64, 1), 'double', True, True): ~581 MLUPS +(200, (128, 1), 'single', True, True): ~579 MLUPS +(200, (128, 1), 'double', True, True): ~579 MLUPS +(200, (16, 1), 'single', True, True): ~574 MLUPS +(200, (16, 1), 'double', True, True): ~584 MLUPS +(1000, (256, 1), 'single', True, True): ~6403 MLUPS +(1000, (256, 1), 'double', True, True): ~3343 MLUPS +(1000, (32, 1), 'single', True, True): ~6414 MLUPS +(1000, (32, 1), 'double', True, True): ~3362 MLUPS +(1000, (64, 1), 'single', True, True): ~6300 MLUPS +(1000, (64, 1), 'double', True, True): ~3379 MLUPS +(1000, (128, 1), 'single', True, True): ~6342 MLUPS +(1000, (128, 1), 'double', True, True): ~3385 MLUPS +(1000, (512, 1), 'single', True, True): ~6401 MLUPS +(1000, (512, 1), 'double', True, True): ~3360 MLUPS +(1000, (1024, 1), 'single', True, True): ~6395 MLUPS +(1000, (1024, 1), 'double', True, True): ~3301 MLUPS +(1000, (16, 1), 'single', True, True): ~5847 MLUPS +(1000, (16, 1), 'double', True, True): ~3201 MLUPS +(400, (256, 1), 'single', True, True): ~2077 MLUPS +(400, (256, 1), 'double', True, True): ~2031 MLUPS +(400, (32, 1), 'single', True, True): ~2078 MLUPS +(400, (32, 1), 'double', True, True): ~2059 MLUPS +(400, (64, 1), 'single', True, True): ~2066 MLUPS +(400, (64, 1), 'double', True, True): ~2043 MLUPS +(400, (128, 1), 'single', True, True): ~2082 MLUPS +(400, (128, 1), 'double', True, True): ~2072 MLUPS +(400, (16, 1), 'single', True, True): ~2092 MLUPS +(400, (16, 1), 'double', True, True): ~2272 MLUPS +(50, (32, 1), 'single', True, True): ~32 MLUPS +(50, (32, 1), 'double', True, True): ~32 MLUPS +(50, (64, 1), 'single', True, True): ~32 MLUPS +(50, (64, 1), 'double', True, True): ~32 MLUPS +(50, (128, 1), 'single', True, True): ~32 MLUPS +(50, (128, 1), 'double', True, True): ~32 MLUPS +(50, (16, 1), 'single', True, True): ~32 MLUPS +(50, (16, 1), 'double', True, True): ~32 MLUPS +(600, (256, 1), 'single', True, True): ~4592 MLUPS +(600, (256, 1), 'double', True, True): ~3299 MLUPS +(600, (32, 1), 'single', True, True): ~4678 MLUPS +(600, (32, 1), 'double', True, True): ~3330 MLUPS +(600, (64, 1), 'single', True, True): ~4588 MLUPS +(600, (64, 1), 'double', True, True): ~3310 MLUPS +(600, (128, 1), 'single', True, True): ~4594 MLUPS +(600, (128, 1), 'double', True, True): ~3313 MLUPS +(600, (512, 1), 'single', True, True): ~4517 MLUPS +(600, (512, 1), 'double', True, True): ~3200 MLUPS +(600, (16, 1), 'single', True, True): ~4661 MLUPS +(600, (16, 1), 'double', True, True): ~3260 MLUPS diff --git a/result/ldc_2d_benchmark_P100.py b/result/ldc_2d_benchmark_P100.py index 50f5f9d..683d22d 100644 --- a/result/ldc_2d_benchmark_P100.py +++ b/result/ldc_2d_benchmark_P100.py @@ -1 +1 @@ -ldc_2d_p100 = [((32, (16, 1), 'single', True), [14, 14, 14, 14, 14, 14, 15, 14, 15, 14]), ((32, (16, 1), 'single', False), [15, 15, 15, 15, 15, 15, 15, 15, 15, 15]), ((32, (16, 1), 'double', True), [15, 15, 15, 15, 15, 15, 15, 15, 15, 15]), ((32, (16, 1), 'double', False), [15, 15, 15, 15, 15, 15, 15, 15, 15, 15]), ((32, (32, 1), 'single', True), [14, 15, 15, 15, 15, 15, 15, 15, 15, 15]), ((32, (32, 1), 'single', False), [15, 15, 15, 15, 15, 15, 15, 15, 15, 15]), ((32, (32, 1), 'double', True), [15, 15, 15, 15, 15, 15, 15, 15, 15, 15]), ((32, (32, 1), 'double', False), [15, 15, 15, 15, 15, 15, 15, 15, 15, 15]), ((64, (16, 1), 'single', True), [59, 59, 61, 59, 56, 56, 56, 58, 60, 61]), ((64, (16, 1), 'single', False), [58, 59, 60, 60, 60, 59, 59, 59, 59, 59]), ((64, (16, 1), 'double', True), [58, 59, 59, 60, 60, 59, 60, 59, 59, 60]), ((64, (16, 1), 'double', False), [56, 56, 56, 57, 57, 57, 57, 57, 57, 56]), ((64, (32, 1), 'single', True), [59, 60, 59, 60, 61, 60, 61, 60, 61, 61]), ((64, (32, 1), 'single', False), [59, 59, 60, 60, 60, 60, 60, 59, 60, 60]), ((64, (32, 1), 'double', True), [58, 60, 60, 59, 60, 60, 59, 60, 60, 59]), ((64, (32, 1), 'double', False), [57, 60, 59, 60, 61, 60, 59, 60, 60, 60]), ((64, (64, 1), 'single', True), [59, 60, 60, 60, 60, 59, 60, 61, 60, 61]), ((64, (64, 1), 'single', False), [58, 58, 59, 59, 59, 58, 56, 59, 56, 58]), ((64, (64, 1), 'double', True), [58, 60, 59, 60, 60, 61, 61, 60, 60, 60]), ((64, (64, 1), 'double', False), [59, 59, 59, 59, 59, 59, 60, 59, 60, 59]), ((96, (16, 1), 'single', True), [132, 132, 133, 131, 134, 134, 135, 134, 134, 134]), ((96, (16, 1), 'single', False), [132, 131, 132, 132, 135, 134, 132, 133, 133, 133]), ((96, (16, 1), 'double', True), [132, 133, 130, 133, 134, 134, 135, 133, 134, 133]), ((96, (16, 1), 'double', False), [126, 125, 128, 128, 126, 126, 123, 127, 126, 127]), ((96, (24, 1), 'single', True), [122, 124, 125, 126, 132, 135, 133, 128, 133, 133]), ((96, (24, 1), 'single', False), [132, 133, 135, 135, 134, 135, 135, 133, 132, 133]), ((96, (24, 1), 'double', True), [132, 135, 133, 135, 135, 135, 132, 135, 134, 135]), ((96, (24, 1), 'double', False), [133, 133, 134, 131, 135, 131, 136, 136, 133, 134]), ((96, (32, 1), 'single', True), [133, 136, 135, 135, 133, 137, 131, 135, 135, 134]), ((96, (32, 1), 'single', False), [132, 132, 134, 133, 133, 134, 134, 134, 132, 135]), ((96, (32, 1), 'double', True), [132, 135, 134, 136, 135, 135, 136, 134, 136, 135]), ((96, (32, 1), 'double', False), [129, 133, 134, 136, 137, 135, 136, 132, 134, 136]), ((96, (48, 1), 'single', True), [129, 133, 131, 132, 133, 134, 135, 136, 134, 135]), ((96, (48, 1), 'single', False), [133, 135, 135, 136, 135, 135, 136, 135, 135, 135]), ((96, (48, 1), 'double', True), [134, 136, 136, 135, 137, 137, 136, 136, 135, 137]), ((96, (48, 1), 'double', False), [132, 134, 134, 134, 132, 133, 134, 135, 134, 133]), ((96, (96, 1), 'single', True), [135, 137, 135, 137, 137, 136, 138, 137, 137, 136]), ((96, (96, 1), 'single', False), [134, 134, 136, 135, 137, 138, 137, 136, 135, 137]), ((96, (96, 1), 'double', True), [134, 135, 136, 137, 136, 137, 138, 138, 137, 139]), ((96, (96, 1), 'double', False), [134, 136, 137, 136, 136, 137, 135, 137, 138, 135]), ((128, (16, 1), 'single', True), [238, 234, 238, 243, 243, 244, 242, 244, 240, 238]), ((128, (16, 1), 'single', False), [218, 218, 222, 222, 222, 221, 221, 222, 221, 220]), ((128, (16, 1), 'double', True), [227, 229, 229, 229, 223, 216, 218, 219, 212, 220]), ((128, (16, 1), 'double', False), [201, 205, 204, 204, 205, 205, 205, 204, 205, 204]), ((128, (32, 1), 'single', True), [214, 215, 214, 217, 219, 217, 217, 221, 230, 224]), ((128, (32, 1), 'single', False), [236, 239, 240, 236, 235, 236, 235, 236, 238, 240]), ((128, (32, 1), 'double', True), [237, 241, 240, 241, 241, 237, 241, 241, 242, 243]), ((128, (32, 1), 'double', False), [239, 244, 243, 241, 244, 243, 244, 244, 243, 241]), ((128, (64, 1), 'single', True), [239, 242, 241, 243, 242, 242, 242, 242, 242, 236]), ((128, (64, 1), 'single', False), [237, 241, 241, 239, 239, 240, 242, 241, 241, 239]), ((128, (64, 1), 'double', True), [240, 240, 241, 243, 240, 242, 242, 244, 240, 245]), ((128, (64, 1), 'double', False), [234, 237, 231, 237, 236, 241, 240, 239, 242, 240]), ((128, (128, 1), 'single', True), [236, 241, 238, 237, 240, 243, 242, 240, 240, 242]), ((128, (128, 1), 'single', False), [238, 239, 235, 242, 235, 240, 238, 239, 240, 238]), ((128, (128, 1), 'double', True), [238, 238, 241, 239, 238, 239, 239, 238, 237, 235]), ((128, (128, 1), 'double', False), [239, 236, 242, 238, 243, 238, 237, 238, 234, 241]), ((256, (16, 1), 'single', True), [937, 948, 946, 955, 960, 957, 963, 960, 956, 954]), ((256, (16, 1), 'single', False), [926, 932, 943, 929, 931, 929, 933, 928, 930, 944]), ((256, (16, 1), 'double', True), [944, 958, 957, 955, 960, 957, 960, 955, 966, 963]), ((256, (16, 1), 'double', False), [902, 901, 898, 905, 916, 919, 911, 907, 904, 900]), ((256, (32, 1), 'single', True), [960, 954, 974, 979, 981, 982, 978, 975, 970, 976]), ((256, (32, 1), 'single', False), [952, 956, 970, 971, 960, 968, 966, 955, 967, 971]), ((256, (32, 1), 'double', True), [946, 946, 968, 972, 975, 972, 962, 974, 972, 970]), ((256, (32, 1), 'double', False), [955, 955, 962, 943, 958, 957, 962, 967, 965, 974]), ((256, (64, 1), 'single', True), [943, 960, 937, 966, 966, 964, 969, 970, 970, 964]), ((256, (64, 1), 'single', False), [953, 965, 963, 971, 966, 975, 974, 972, 974, 971]), ((256, (64, 1), 'double', True), [961, 974, 934, 968, 975, 977, 958, 975, 974, 974]), ((256, (64, 1), 'double', False), [947, 961, 962, 957, 964, 966, 951, 967, 969, 958]), ((256, (128, 1), 'single', True), [942, 953, 932, 962, 965, 960, 964, 963, 955, 963]), ((256, (128, 1), 'single', False), [944, 960, 917, 946, 833, 803, 902, 965, 958, 962]), ((256, (128, 1), 'double', True), [931, 950, 969, 973, 976, 969, 960, 951, 970, 958]), ((256, (128, 1), 'double', False), [948, 958, 966, 970, 955, 959, 960, 969, 962, 967]), ((256, (256, 1), 'single', True), [933, 964, 966, 956, 974, 973, 971, 974, 972, 971]), ((256, (256, 1), 'single', False), [953, 970, 970, 970, 966, 962, 971, 964, 969, 965]), ((256, (256, 1), 'double', True), [952, 966, 970, 968, 972, 972, 971, 974, 981, 976]), ((256, (256, 1), 'double', False), [937, 956, 956, 959, 961, 964, 966, 948, 966, 958]), ((512, (16, 1), 'single', True), [3758, 3817, 3803, 3814, 3816, 3811, 3804, 3808, 3807, 3830]), ((512, (16, 1), 'single', False), [3289, 3027, 2960, 2908, 2856, 2829, 2830, 2827, 2831, 2832]), ((512, (16, 1), 'double', True), [3252, 3265, 3278, 3277, 3277, 3277, 3275, 3275, 3274, 3278]), ((512, (16, 1), 'double', False), [1303, 1256, 1225, 1220, 1221, 1222, 1221, 1221, 1222, 1222]), ((512, (32, 1), 'single', True), [3768, 3788, 3814, 3816, 3829, 3788, 3707, 3770, 3809, 3773]), ((512, (32, 1), 'single', False), [3729, 3795, 2896, 3638, 3745, 3759, 3799, 3823, 3810, 3824]), ((512, (32, 1), 'double', True), [3270, 3294, 3295, 3285, 3279, 3283, 3288, 3284, 3281, 3283]), ((512, (32, 1), 'double', False), [2381, 2322, 2286, 2285, 2284, 2288, 2289, 2290, 2286, 2289]), ((512, (64, 1), 'single', True), [3718, 3773, 3809, 3809, 3794, 3815, 3784, 3837, 3829, 3823]), ((512, (64, 1), 'single', False), [3747, 3796, 3799, 3826, 3809, 3820, 3773, 3837, 3837, 3818]), ((512, (64, 1), 'double', True), [3282, 3303, 3299, 3304, 3303, 3306, 3293, 3302, 3298, 3304]), ((512, (64, 1), 'double', False), [2372, 2315, 2274, 2269, 2270, 2276, 2276, 2274, 2276, 2274]), ((512, (128, 1), 'single', True), [3667, 3760, 3805, 3790, 3766, 3763, 3756, 3821, 3770, 3793]), ((512, (128, 1), 'single', False), [2337, 3498, 3708, 3639, 3708, 3511, 2649, 3632, 3681, 3725]), ((512, (128, 1), 'double', True), [3275, 3298, 3298, 3297, 3300, 3298, 3301, 3296, 3296, 3295]), ((512, (128, 1), 'double', False), [2368, 2313, 2265, 2264, 2263, 2263, 2265, 2267, 2267, 2268]), ((512, (256, 1), 'single', True), [3684, 3785, 3654, 3725, 3774, 3816, 3799, 3819, 3790, 3800]), ((512, (256, 1), 'single', False), [3831, 3853, 3903, 3884, 3897, 3906, 3893, 3906, 3914, 3906]), ((512, (256, 1), 'double', True), [3270, 3290, 3291, 3292, 3290, 3285, 3290, 3291, 3292, 3290]), ((512, (256, 1), 'double', False), [2378, 2325, 2279, 2266, 2275, 2277, 2281, 2278, 2289, 2289]), ((512, (512, 1), 'single', True), [3762, 3819, 3827, 3839, 3825, 3844, 3822, 3863, 3856, 3846]), ((512, (512, 1), 'single', False), [3757, 3810, 3803, 3828, 3777, 3820, 3831, 3829, 3840, 3826]), ((512, (512, 1), 'double', True), [3272, 3294, 3288, 3292, 3296, 3295, 3292, 3292, 3290, 3292]), ((512, (512, 1), 'double', False), [2196, 2126, 2115, 2113, 2114, 2113, 2115, 2113, 2115, 2113]), ((1024, (16, 1), 'single', True), [6315, 6335, 6334, 6333, 6333, 6331, 6336, 6335, 6335, 6337]), ((1024, (16, 1), 'single', False), [3978, 3949, 3913, 3869, 3825, 3785, 3749, 3713, 3676, 3641]), ((1024, (16, 1), 'double', True), [3470, 3473, 3473, 3471, 3474, 3474, 3474, 3474, 3475, 3473]), ((1024, (16, 1), 'double', False), [1380, 1344, 1319, 1297, 1276, 1262, 1262, 1263, 1260, 1256]), ((1024, (32, 1), 'single', True), [6628, 6642, 6636, 6640, 6644, 6645, 6648, 6644, 6644, 6645]), ((1024, (32, 1), 'single', False), [6493, 6510, 6510, 6507, 6499, 6499, 6494, 6483, 6489, 6480]), ((1024, (32, 1), 'double', True), [3461, 3472, 3472, 3473, 3472, 3473, 3469, 3471, 3473, 3472]), ((1024, (32, 1), 'double', False), [2673, 2615, 2571, 2529, 2492, 2469, 2474, 2476, 2479, 2480]), ((1024, (64, 1), 'single', True), [6575, 6592, 6587, 6591, 6581, 6587, 6595, 6594, 6593, 6591]), ((1024, (64, 1), 'single', False), [6418, 6454, 6450, 6446, 6443, 6432, 6429, 6431, 6429, 6431]), ((1024, (64, 1), 'double', True), [3440, 3448, 3452, 3451, 3453, 3455, 3451, 3457, 3451, 3450]), ((1024, (64, 1), 'double', False), [2668, 2610, 2565, 2524, 2487, 2466, 2469, 2473, 2475, 2474]), ((1024, (128, 1), 'single', True), [6577, 6609, 6610, 6608, 6609, 6609, 6604, 6609, 6613, 6606]), ((1024, (128, 1), 'single', False), [6402, 6443, 6448, 6441, 6436, 6434, 6421, 6419, 6421, 6410]), ((1024, (128, 1), 'double', True), [3446, 3451, 3451, 3449, 3450, 3451, 3448, 3451, 3450, 3451]), ((1024, (128, 1), 'double', False), [2672, 2618, 2573, 2531, 2491, 2467, 2469, 2473, 2475, 2476]), ((1024, (256, 1), 'single', True), [6589, 6605, 6604, 6605, 6603, 6606, 6604, 6607, 6597, 6601]), ((1024, (256, 1), 'single', False), [6365, 6391, 6384, 6367, 6362, 6348, 6349, 6337, 6342, 6314]), ((1024, (256, 1), 'double', True), [3454, 3457, 3456, 3455, 3457, 3456, 3457, 3458, 3456, 3456]), ((1024, (256, 1), 'double', False), [2709, 2651, 2631, 2577, 2540, 2516, 2525, 2526, 2527, 2528]), ((1024, (512, 1), 'single', True), [6584, 6595, 6592, 6598, 6599, 6592, 6598, 6588, 6602, 6594]), ((1024, (512, 1), 'single', False), [6166, 6202, 6187, 6175, 6153, 6146, 6129, 6131, 6098, 6050]), ((1024, (512, 1), 'double', True), [3461, 3463, 3465, 3465, 3465, 3465, 3464, 3466, 3465, 3464]), ((1024, (512, 1), 'double', False), [2613, 2539, 2490, 2447, 2405, 2359, 2357, 2358, 2357, 2358]), ((1024, (1024, 1), 'single', True), [6536, 6547, 6545, 6551, 6551, 6552, 6550, 6546, 6549, 6547]), ((1024, (1024, 1), 'single', False), [5703, 5711, 5692, 5667, 5630, 5589, 5574, 5564, 5530, 5497]), ((1024, (1024, 1), 'double', True), [3417, 3421, 3420, 3420, 3421, 3421, 3422, 3422, 3421, 3423]), ((1024, (1024, 1), 'double', False), [2346, 2322, 2301, 2274, 2241, 2215, 2216, 2217, 2219, 2218]), ((2048, (16, 1), 'single', True), [6450, 6508, 6522, 6523, 6523, 6524, 6522, 6522, 6524, 6521]), ((2048, (16, 1), 'double', True), [3552, 3556, 3555, 3555, 3555, 3555, 3555, 3556, 3555, 3556]), ((2048, (32, 1), 'single', True), [6813, 6829, 6831, 6831, 6831, 6830, 6831, 6831, 5781, 6829]), ((2048, (32, 1), 'double', True), [3569, 3573, 3574, 3573, 3574, 3574, 3572, 3573, 3573, 3573]), ((2048, (64, 1), 'single', True), [6756, 6774, 6771, 6765, 6765, 6767, 6766, 6768, 6766, 6767]), ((2048, (64, 1), 'double', True), [3552, 3557, 3557, 3557, 3557, 3557, 3557, 3558, 3557, 3557]), ((2048, (128, 1), 'single', True), [6780, 6794, 6791, 6793, 6791, 6793, 6792, 6791, 6791, 6793]), ((2048, (128, 1), 'double', True), [3551, 3554, 3554, 3553, 3552, 3554, 3554, 3554, 3555, 3555]), ((2048, (256, 1), 'single', True), [6788, 6794, 6795, 6795, 6795, 6795, 6796, 6796, 6796, 6797]), ((2048, (256, 1), 'double', True), [3565, 3562, 3560, 3559, 3559, 3560, 3560, 3560, 3560, 3559]), ((2048, (512, 1), 'single', True), [6795, 6803, 6802, 6804, 6805, 6803, 6804, 6803, 6804, 6803]), ((2048, (512, 1), 'double', True), [3559, 3563, 3563, 3564, 3564, 3564, 3564, 3563, 3564, 3564]), ((2048, (1024, 1), 'single', True), [6740, 6745, 6746, 6747, 6748, 6745, 6734, 6746, 6745, 6746]), ((2048, (1024, 1), 'double', True), [3518, 3522, 3522, 3522, 3522, 3522, 3522, 3522, 3522, 3522]), ((4096, (16, 1), 'single', True), [6564, 6583, 6583, 6583, 6584, 6583, 6583, 6583, 6584, 6583]), ((4096, (16, 1), 'double', True), [3444, 3442, 3442, 3442, 3442, 3442, 3442, 3442, 3442, 3442]), ((4096, (32, 1), 'single', True), [6972, 6963, 6963, 6963, 6963, 6963, 6963, 6961, 6959, 6963]), ((4096, (32, 1), 'double', True), [3462, 3459, 3460, 3460, 3460, 3460, 3459, 3459, 3459, 3459]), ((4096, (64, 1), 'single', True), [6897, 6902, 6901, 6901, 6902, 6901, 6900, 6901, 6902, 6901]), ((4096, (64, 1), 'double', True), [3437, 3438, 3438, 3438, 3438, 3438, 3438, 3438, 3438, 3438]), ((4096, (128, 1), 'single', True), [6925, 6923, 6923, 6923, 6923, 6923, 6923, 6923, 6924, 6923]), ((4096, (128, 1), 'double', True), [3421, 3420, 3419, 3420, 3420, 3420, 3420, 3420, 3420, 3420]), ((4096, (256, 1), 'single', True), [6896, 6881, 6881, 6882, 6882, 6881, 6882, 6882, 6881, 6881]), ((4096, (256, 1), 'double', True), [3433, 3433, 3433, 3434, 3433, 3433, 3433, 3433, 3433, 3433]), ((4096, (512, 1), 'single', True), [6900, 6890, 6890, 6889, 6889, 6890, 6890, 6890, 6890, 6889]), ((4096, (512, 1), 'double', True), [3444, 3442, 3442, 3442, 3442, 3442, 3442, 3442, 3442, 3442]), ((4096, (1024, 1), 'single', True), [6872, 6861, 6861, 6861, 6861, 6860, 6860, 6861, 6861, 6861]), ((4096, (1024, 1), 'double', True), [3410, 3410, 3410, 3411, 3411, 3411, 3411, 3411, 3411, 3410])] +ldc_2d_p100 = [((32, (32, 1), 'single', False, True), [13, 14, 14, 14, 14]), ((32, (32, 1), 'single', True, True), [13, 14, 14, 14, 14]), ((32, (32, 1), 'double', False, True), [13, 13, 13, 14, 14]), ((32, (32, 1), 'double', True, True), [13, 14, 13, 13, 14]), ((32, (16, 1), 'single', False, True), [13, 14, 14, 14, 14]), ((32, (16, 1), 'single', True, True), [13, 13, 13, 13, 13]), ((32, (16, 1), 'double', False, True), [13, 14, 14, 13, 14]), ((32, (16, 1), 'double', True, True), [13, 14, 14, 13, 14]), ((256, (256, 1), 'single', False, True), [840, 857, 850, 857, 857]), ((256, (256, 1), 'single', True, True), [853, 860, 867, 866, 864]), ((256, (256, 1), 'double', False, True), [839, 849, 850, 848, 852]), ((256, (256, 1), 'double', True, True), [840, 862, 860, 858, 862]), ((256, (32, 1), 'single', False, True), [856, 866, 851, 868, 871]), ((256, (32, 1), 'single', True, True), [853, 863, 863, 856, 861]), ((256, (32, 1), 'double', False, True), [840, 857, 855, 853, 854]), ((256, (32, 1), 'double', True, True), [832, 851, 849, 856, 856]), ((256, (64, 1), 'single', False, True), [822, 840, 831, 791, 783]), ((256, (64, 1), 'single', True, True), [848, 859, 856, 859, 860]), ((256, (64, 1), 'double', False, True), [836, 850, 852, 856, 852]), ((256, (64, 1), 'double', True, True), [847, 863, 860, 859, 857]), ((256, (128, 1), 'single', False, True), [942, 947, 953, 957, 962]), ((256, (128, 1), 'single', True, True), [937, 960, 950, 953, 965]), ((256, (128, 1), 'double', False, True), [916, 947, 954, 946, 931]), ((256, (128, 1), 'double', True, True), [940, 969, 965, 969, 980]), ((256, (16, 1), 'single', False, True), [938, 960, 935, 963, 955]), ((256, (16, 1), 'single', True, True), [926, 951, 938, 948, 933]), ((256, (16, 1), 'double', False, True), [929, 937, 944, 942, 927]), ((256, (16, 1), 'double', True, True), [894, 919, 916, 918, 918]), ((64, (32, 1), 'single', False, True), [56, 57, 57, 57, 57]), ((64, (32, 1), 'single', True, True), [59, 60, 59, 60, 60]), ((64, (32, 1), 'double', False, True), [57, 58, 59, 59, 59]), ((64, (32, 1), 'double', True, True), [58, 59, 59, 59, 59]), ((64, (64, 1), 'single', False, True), [58, 58, 59, 59, 59]), ((64, (64, 1), 'single', True, True), [58, 59, 60, 58, 60]), ((64, (64, 1), 'double', False, True), [54, 56, 59, 59, 59]), ((64, (64, 1), 'double', True, True), [59, 60, 59, 59, 59]), ((64, (16, 1), 'single', False, True), [59, 60, 58, 60, 60]), ((64, (16, 1), 'single', True, True), [59, 60, 59, 60, 61]), ((64, (16, 1), 'double', False, True), [58, 59, 59, 59, 60]), ((64, (16, 1), 'double', True, True), [58, 59, 60, 60, 57]), ((128, (32, 1), 'single', False, True), [213, 216, 211, 214, 215]), ((128, (32, 1), 'single', True, True), [213, 215, 216, 216, 218]), ((128, (32, 1), 'double', False, True), [211, 214, 213, 214, 215]), ((128, (32, 1), 'double', True, True), [213, 217, 216, 216, 217]), ((128, (64, 1), 'single', False, True), [213, 217, 217, 216, 216]), ((128, (64, 1), 'single', True, True), [213, 217, 217, 216, 215]), ((128, (64, 1), 'double', False, True), [214, 213, 216, 217, 218]), ((128, (64, 1), 'double', True, True), [215, 216, 218, 218, 218]), ((128, (128, 1), 'single', False, True), [214, 217, 218, 217, 217]), ((128, (128, 1), 'single', True, True), [213, 216, 215, 217, 218]), ((128, (128, 1), 'double', False, True), [210, 214, 215, 215, 215]), ((128, (128, 1), 'double', True, True), [212, 215, 215, 215, 214]), ((128, (16, 1), 'single', False, True), [212, 214, 215, 214, 215]), ((128, (16, 1), 'single', True, True), [214, 215, 216, 217, 217]), ((128, (16, 1), 'double', False, True), [212, 214, 214, 214, 212]), ((128, (16, 1), 'double', True, True), [215, 215, 217, 218, 219]), ((512, (256, 1), 'single', False, True), [3342, 3382, 3385, 3387, 3386]), ((512, (256, 1), 'single', True, True), [3382, 3411, 3429, 3429, 3385]), ((512, (256, 1), 'double', False, True), [2254, 2187, 2107, 2089, 2089]), ((512, (256, 1), 'double', True, True), [3307, 3344, 3347, 3348, 3350]), ((512, (32, 1), 'single', False, True), [3390, 3418, 3406, 3434, 3446]), ((512, (32, 1), 'single', True, True), [3360, 3409, 3415, 3419, 3407]), ((512, (32, 1), 'double', False, True), [2238, 2160, 2087, 2073, 2075]), ((512, (32, 1), 'double', True, True), [3329, 3366, 3366, 3369, 3368]), ((512, (64, 1), 'single', False, True), [3586, 3598, 3639, 3652, 3669]), ((512, (64, 1), 'single', True, True), [3356, 3425, 3425, 3435, 3429]), ((512, (64, 1), 'double', False, True), [2204, 2138, 2063, 2046, 2059]), ((512, (64, 1), 'double', True, True), [3313, 3359, 3364, 3358, 3365]), ((512, (128, 1), 'single', False, True), [3328, 3408, 3410, 3410, 3408]), ((512, (128, 1), 'single', True, True), [3368, 3431, 3412, 3425, 3418]), ((512, (128, 1), 'double', False, True), [2060, 1997, 1925, 1909, 1910]), ((512, (128, 1), 'double', True, True), [3307, 3322, 3332, 3331, 3334]), ((512, (512, 1), 'single', False, True), [3375, 3415, 2523, 3422, 3436]), ((512, (512, 1), 'single', True, True), [3369, 3409, 3409, 3420, 3433]), ((512, (512, 1), 'double', False, True), [2124, 2069, 2006, 1973, 1975]), ((512, (512, 1), 'double', True, True), [3301, 3323, 3346, 3342, 3343]), ((512, (16, 1), 'single', False, True), [3270, 3257, 3192, 3129, 3070]), ((512, (16, 1), 'single', True, True), [3409, 3444, 3453, 3453, 3446]), ((512, (16, 1), 'double', False, True), [1204, 1160, 1115, 1103, 1103]), ((512, (16, 1), 'double', True, True), [3281, 3310, 3311, 3311, 3316]), ((1024, (256, 1), 'single', False, True), [6327, 6343, 6308, 6283, 6253]), ((1024, (256, 1), 'single', True, True), [6601, 6627, 6626, 6627, 6624]), ((1024, (256, 1), 'double', False, True), [2729, 2683, 2631, 2597, 2549]), ((1024, (256, 1), 'double', True, True), [3475, 3482, 3482, 3483, 3483]), ((1024, (32, 1), 'single', False, True), [6582, 6622, 6614, 6603, 6598]), ((1024, (32, 1), 'single', True, True), [6711, 6732, 6732, 6735, 6731]), ((1024, (32, 1), 'double', False, True), [2701, 2658, 2613, 2561, 2507]), ((1024, (32, 1), 'double', True, True), [3489, 3493, 3490, 3492, 3491]), ((1024, (64, 1), 'single', False, True), [6530, 6565, 6564, 6558, 6546]), ((1024, (64, 1), 'single', True, True), [6688, 6698, 6704, 6703, 6703]), ((1024, (64, 1), 'double', False, True), [2696, 2655, 2609, 2557, 2503]), ((1024, (64, 1), 'double', True, True), [3483, 3485, 3487, 3487, 3486]), ((1024, (128, 1), 'single', False, True), [6460, 6494, 6486, 6481, 6473]), ((1024, (128, 1), 'single', True, True), [6686, 6701, 6697, 6699, 6697]), ((1024, (128, 1), 'double', False, True), [2697, 2656, 2612, 2561, 2506]), ((1024, (128, 1), 'double', True, True), [3457, 3460, 3460, 3460, 3460]), ((1024, (512, 1), 'single', False, True), [6188, 6205, 6191, 6177, 6159]), ((1024, (512, 1), 'single', True, True), [6697, 6707, 6718, 6721, 6717]), ((1024, (512, 1), 'double', False, True), [2665, 2650, 2596, 2514, 2443]), ((1024, (512, 1), 'double', True, True), [3489, 3494, 3493, 3494, 3494]), ((1024, (1024, 1), 'single', False, True), [5747, 5732, 5712, 5681, 5654]), ((1024, (1024, 1), 'single', True, True), [6636, 6647, 6652, 6650, 6651]), ((1024, (1024, 1), 'double', False, True), [2410, 2374, 2342, 2304, 2262]), ((1024, (1024, 1), 'double', True, True), [3344, 3349, 3349, 3348, 3349]), ((1024, (16, 1), 'single', False, True), [3949, 3914, 3876, 3834, 3793]), ((1024, (16, 1), 'single', True, True), [6451, 6461, 6462, 6464, 6462]), ((1024, (16, 1), 'double', False, True), [1385, 1358, 1335, 1309, 1282]), ((1024, (16, 1), 'double', True, True), [3441, 3444, 3445, 3444, 3443]), ((2048, (256, 1), 'single', False, True), [6674, 6714, 6776, 6827, 6822]), ((2048, (256, 1), 'single', True, True), [6879, 6886, 6886, 6886, 6886]), ((2048, (256, 1), 'double', False, True), [2845, 2826, 2817, 2806, 2778]), ((2048, (256, 1), 'double', True, True), [3569, 3571, 3570, 3571, 3571]), ((2048, (32, 1), 'single', False, True), [6954, 6961, 6959, 6958, 6955]), ((2048, (32, 1), 'single', True, True), [6924, 6933, 6924, 6916, 6915]), ((2048, (32, 1), 'double', False, True), [2757, 2735, 2716, 2694, 2671]), ((2048, (32, 1), 'double', True, True), [3582, 3586, 3586, 3586, 3585]), ((2048, (64, 1), 'single', False, True), [6859, 6869, 6868, 6866, 6865]), ((2048, (64, 1), 'single', True, True), [6825, 6835, 6837, 6836, 6836]), ((2048, (64, 1), 'double', False, True), [2498, 2661, 2697, 2694, 2671]), ((2048, (64, 1), 'double', True, True), [3569, 3570, 3571, 3571, 3570]), ((2048, (128, 1), 'single', False, True), [6801, 6815, 6813, 6811, 6808]), ((2048, (128, 1), 'single', True, True), [6884, 6890, 6891, 6891, 6890]), ((2048, (128, 1), 'double', False, True), [2760, 2739, 2720, 2700, 2677]), ((2048, (128, 1), 'double', True, True), [3569, 3571, 3571, 3572, 3571]), ((2048, (512, 1), 'single', False, True), [6293, 6613, 6657, 6668, 6696]), ((2048, (512, 1), 'single', True, True), [6827, 6833, 6834, 6834, 6834]), ((2048, (512, 1), 'double', False, True), [2781, 2757, 2736, 2708, 2679]), ((2048, (512, 1), 'double', True, True), [3570, 3574, 3574, 3574, 3574]), ((2048, (1024, 1), 'single', False, True), [6290, 6291, 6274, 6258, 6234]), ((2048, (1024, 1), 'single', True, True), [6802, 6812, 6813, 6815, 6813]), ((2048, (1024, 1), 'double', False, True), [2405, 2494, 2495, 2481, 2464]), ((2048, (1024, 1), 'double', True, True), [3532, 3535, 3536, 3535, 3535]), ((2048, (16, 1), 'single', False, True), [3944, 3926, 3907, 3886, 3864]), ((2048, (16, 1), 'single', True, True), [6684, 6695, 6696, 6695, 6696]), ((2048, (16, 1), 'double', False, True), [1392, 1376, 1367, 1356, 1345]), ((2048, (16, 1), 'double', True, True), [3585, 3582, 3576, 3575, 3575]), ((800, (200, 1), 'single', True, False), [5980, 6047, 6045, 6051, 6044]), ((800, (200, 1), 'single', True, True), [5997, 6022, 6023, 6010, 6017]), ((800, (200, 1), 'double', True, False), [3211, 3219, 3218, 3217, 3219]), ((800, (200, 1), 'double', True, True), [3265, 3277, 3276, 3276, 3275]), ((800, (10, 1), 'single', True, False), [4672, 4707, 4702, 4702, 4700]), ((800, (10, 1), 'single', True, True), [4713, 4726, 4728, 4729, 4726]), ((800, (10, 1), 'double', True, False), [3049, 3054, 3054, 3051, 3053]), ((800, (10, 1), 'double', True, True), [3028, 3034, 3032, 3032, 3032]), ((800, (100, 1), 'single', True, False), [5961, 5997, 5997, 5998, 6000]), ((800, (100, 1), 'single', True, True), [5842, 5951, 5954, 5940, 5949]), ((800, (100, 1), 'double', True, False), [3140, 3145, 3146, 3147, 3144]), ((800, (100, 1), 'double', True, True), [3210, 3215, 3220, 3218, 3219]), ((800, (50, 1), 'single', True, False), [5907, 5932, 5933, 5934, 5932]), ((800, (50, 1), 'single', True, True), [5871, 5900, 5901, 5909, 5907]), ((800, (50, 1), 'double', True, False), [3137, 3143, 3142, 3140, 3144]), ((800, (50, 1), 'double', True, True), [3152, 3154, 3158, 3159, 3158]), ((100, (10, 1), 'single', True, False), [144, 142, 146, 145, 146]), ((100, (10, 1), 'single', True, True), [143, 145, 144, 143, 142]), ((100, (10, 1), 'double', True, False), [138, 144, 142, 145, 142]), ((100, (10, 1), 'double', True, True), [138, 142, 141, 139, 142]), ((100, (100, 1), 'single', True, False), [143, 144, 142, 144, 145]), ((100, (100, 1), 'single', True, True), [141, 145, 144, 144, 146]), ((100, (100, 1), 'double', True, False), [135, 141, 144, 143, 141]), ((100, (100, 1), 'double', True, True), [143, 146, 145, 144, 146]), ((100, (50, 1), 'single', True, False), [141, 143, 140, 142, 143]), ((100, (50, 1), 'single', True, True), [139, 143, 143, 144, 145]), ((100, (50, 1), 'double', True, False), [145, 147, 148, 148, 147]), ((100, (50, 1), 'double', True, True), [144, 146, 147, 146, 147]), ((200, (200, 1), 'single', True, False), [569, 578, 576, 581, 580]), ((200, (200, 1), 'single', True, True), [572, 575, 576, 578, 582]), ((200, (200, 1), 'double', True, False), [566, 577, 572, 573, 577]), ((200, (200, 1), 'double', True, True), [572, 583, 581, 580, 588]), ((200, (10, 1), 'single', True, False), [570, 585, 587, 586, 586]), ((200, (10, 1), 'single', True, True), [570, 579, 585, 586, 586]), ((200, (10, 1), 'double', True, False), [574, 583, 580, 580, 584]), ((200, (10, 1), 'double', True, True), [576, 585, 585, 585, 587]), ((200, (100, 1), 'single', True, False), [576, 586, 589, 585, 588]), ((200, (100, 1), 'single', True, True), [580, 588, 588, 590, 592]), ((200, (100, 1), 'double', True, False), [574, 580, 580, 584, 582]), ((200, (100, 1), 'double', True, True), [580, 589, 584, 584, 559]), ((200, (50, 1), 'single', True, False), [575, 583, 584, 587, 586]), ((200, (50, 1), 'single', True, True), [580, 590, 591, 590, 592]), ((200, (50, 1), 'double', True, False), [567, 584, 580, 585, 577]), ((200, (50, 1), 'double', True, True), [567, 564, 579, 581, 577]), ((1000, (200, 1), 'single', True, False), [6427, 6444, 6445, 6448, 6447]), ((1000, (200, 1), 'single', True, True), [6241, 6257, 6253, 6252, 6257]), ((1000, (200, 1), 'double', True, False), [3309, 3312, 3314, 3314, 3315]), ((1000, (200, 1), 'double', True, True), [3311, 3318, 3319, 3319, 3318]), ((1000, (10, 1), 'single', True, False), [4982, 4994, 4990, 4994, 4993]), ((1000, (10, 1), 'single', True, True), [4742, 4741, 4751, 4758, 4754]), ((1000, (10, 1), 'double', True, False), [3127, 3131, 3132, 3132, 3130]), ((1000, (10, 1), 'double', True, True), [3123, 3128, 3127, 3129, 3127]), ((1000, (100, 1), 'single', True, False), [6336, 6351, 6348, 6356, 6351]), ((1000, (100, 1), 'single', True, True), [6209, 6217, 6224, 6221, 6219]), ((1000, (100, 1), 'double', True, False), [3323, 3328, 3329, 3329, 3327]), ((1000, (100, 1), 'double', True, True), [3283, 3286, 3290, 3288, 3289]), ((1000, (50, 1), 'single', True, False), [6293, 6325, 6326, 6322, 6326]), ((1000, (50, 1), 'single', True, True), [6086, 6098, 6099, 6098, 6097]), ((1000, (50, 1), 'double', True, False), [3240, 3242, 3244, 3242, 3243]), ((1000, (50, 1), 'double', True, True), [3268, 3270, 3271, 3270, 3270]), ((400, (200, 1), 'single', True, False), [2263, 2306, 2308, 2309, 2289]), ((400, (200, 1), 'single', True, True), [2173, 2264, 2231, 2281, 2313]), ((400, (200, 1), 'double', True, False), [2178, 2182, 2203, 2217, 2205]), ((400, (200, 1), 'double', True, True), [2175, 2192, 2215, 2212, 2226]), ((400, (10, 1), 'single', True, False), [2256, 2263, 2298, 2263, 2313]), ((400, (10, 1), 'single', True, True), [2287, 2338, 2333, 2332, 2339]), ((400, (10, 1), 'double', True, False), [2091, 2180, 2310, 2238, 2259]), ((400, (10, 1), 'double', True, True), [2270, 2304, 2322, 2323, 2314]), ((400, (100, 1), 'single', True, False), [2288, 2325, 2317, 2336, 2331]), ((400, (100, 1), 'single', True, True), [2279, 2315, 2311, 2312, 2318]), ((400, (100, 1), 'double', True, False), [2252, 2313, 2304, 2307, 2315]), ((400, (100, 1), 'double', True, True), [2264, 2317, 2308, 2286, 2309]), ((400, (50, 1), 'single', True, False), [2287, 2318, 2323, 2290, 2317]), ((400, (50, 1), 'single', True, True), [2293, 2315, 2310, 2338, 2337]), ((400, (50, 1), 'double', True, False), [2219, 2221, 2254, 2241, 2291]), ((400, (50, 1), 'double', True, True), [2190, 2235, 2235, 2278, 2264]), ((50, (10, 1), 'single', True, False), [35, 35, 35, 36, 35]), ((50, (10, 1), 'single', True, True), [35, 35, 36, 34, 35]), ((50, (10, 1), 'double', True, False), [34, 35, 36, 35, 36]), ((50, (10, 1), 'double', True, True), [35, 35, 36, 35, 35]), ((50, (50, 1), 'single', True, False), [35, 35, 35, 35, 35]), ((50, (50, 1), 'single', True, True), [35, 36, 35, 36, 36]), ((50, (50, 1), 'double', True, False), [23, 35, 35, 36, 36]), ((50, (50, 1), 'double', True, True), [36, 36, 37, 37, 37]), ((600, (30, 1), 'single', True, False), [4954, 5102, 5105, 5124, 5087]), ((600, (30, 1), 'single', True, True), [5020, 5054, 5086, 5101, 5185]), ((600, (30, 1), 'double', True, False), [3248, 3262, 3260, 3266, 3267]), ((600, (30, 1), 'double', True, True), [3252, 3256, 3263, 3257, 3264]), ((600, (200, 1), 'single', True, False), [4971, 5053, 5097, 5096, 5112]), ((600, (200, 1), 'single', True, True), [4966, 5088, 5100, 5018, 5021]), ((600, (200, 1), 'double', True, False), [3290, 3302, 3301, 3299, 3299]), ((600, (200, 1), 'double', True, True), [3263, 3275, 3280, 3278, 3277]), ((600, (10, 1), 'single', True, False), [4619, 4642, 4647, 4649, 4646]), ((600, (10, 1), 'single', True, True), [4572, 4590, 4601, 4603, 4605]), ((600, (10, 1), 'double', True, False), [3097, 3105, 3105, 3102, 3106]), ((600, (10, 1), 'double', True, True), [3066, 3076, 3078, 3080, 3077]), ((600, (100, 1), 'single', True, False), [5016, 5028, 5093, 5074, 5115]), ((600, (100, 1), 'single', True, True), [4987, 5077, 5086, 5071, 5104]), ((600, (100, 1), 'double', True, False), [3272, 3281, 3283, 3280, 3284]), ((600, (100, 1), 'double', True, True), [3261, 3270, 3267, 3269, 3270]), ((600, (50, 1), 'single', True, False), [5111, 5171, 5223, 5173, 5189]), ((600, (50, 1), 'single', True, True), [5009, 5193, 5150, 5182, 5208]), ((600, (50, 1), 'double', True, False), [3260, 3275, 3275, 3274, 3273]), ((600, (50, 1), 'double', True, True), [3278, 3292, 3292, 3292, 3289]), ((800, (256, 1), 'single', True, True), [5997, 6011, 6023, 6018, 6022]), ((800, (256, 1), 'double', True, True), [3313, 3322, 3323, 3323, 3322]), ((800, (32, 1), 'single', True, True), [6180, 6208, 6215, 6204, 6208]), ((800, (32, 1), 'double', True, True), [3326, 3334, 3333, 3333, 3331]), ((800, (64, 1), 'single', True, True), [6233, 6262, 6267, 6262, 6258]), ((800, (64, 1), 'double', True, True), [3343, 3347, 3349, 3350, 3351]), ((800, (128, 1), 'single', True, True), [6341, 6364, 6365, 6363, 6364]), ((800, (128, 1), 'double', True, True), [3414, 3423, 3422, 3423, 3424]), ((800, (512, 1), 'single', True, True), [6005, 6023, 6024, 6033, 6026]), ((800, (512, 1), 'double', True, True), [3299, 3305, 3307, 3306, 3303]), ((800, (16, 1), 'single', True, True), [5707, 5729, 5732, 5729, 5731]), ((800, (16, 1), 'double', True, True), [3186, 3191, 3190, 3193, 3192]), ((100, (32, 1), 'single', True, True), [145, 147, 148, 147, 148]), ((100, (32, 1), 'double', True, True), [144, 146, 147, 146, 146]), ((100, (64, 1), 'single', True, True), [144, 146, 145, 147, 146]), ((100, (64, 1), 'double', True, True), [145, 147, 146, 147, 149]), ((100, (128, 1), 'single', True, True), [144, 146, 146, 147, 145]), ((100, (128, 1), 'double', True, True), [144, 147, 146, 146, 147]), ((100, (16, 1), 'single', True, True), [146, 148, 148, 149, 149]), ((100, (16, 1), 'double', True, True), [144, 146, 146, 147, 147]), ((200, (256, 1), 'single', True, True), [573, 587, 583, 586, 590]), ((200, (256, 1), 'double', True, True), [568, 572, 573, 575, 580]), ((200, (32, 1), 'single', True, True), [574, 582, 582, 586, 577]), ((200, (32, 1), 'double', True, True), [565, 580, 580, 581, 582]), ((200, (64, 1), 'single', True, True), [575, 581, 580, 582, 581]), ((200, (64, 1), 'double', True, True), [573, 581, 588, 584, 583]), ((200, (128, 1), 'single', True, True), [573, 579, 578, 587, 582]), ((200, (128, 1), 'double', True, True), [570, 577, 586, 582, 580]), ((200, (16, 1), 'single', True, True), [575, 556, 583, 573, 586]), ((200, (16, 1), 'double', True, True), [574, 586, 584, 588, 589]), ((1000, (256, 1), 'single', True, True), [6391, 6406, 6407, 6406, 6407]), ((1000, (256, 1), 'double', True, True), [3339, 3344, 3345, 3345, 3345]), ((1000, (32, 1), 'single', True, True), [6403, 6415, 6419, 6417, 6417]), ((1000, (32, 1), 'double', True, True), [3358, 3364, 3363, 3363, 3363]), ((1000, (64, 1), 'single', True, True), [6289, 6300, 6303, 6305, 6305]), ((1000, (64, 1), 'double', True, True), [3376, 3379, 3381, 3380, 3380]), ((1000, (128, 1), 'single', True, True), [6329, 6342, 6350, 6343, 6346]), ((1000, (128, 1), 'double', True, True), [3383, 3384, 3387, 3385, 3387]), ((1000, (512, 1), 'single', True, True), [6391, 6399, 6404, 6408, 6405]), ((1000, (512, 1), 'double', True, True), [3357, 3361, 3362, 3361, 3363]), ((1000, (1024, 1), 'single', True, True), [6379, 6397, 6398, 6404, 6398]), ((1000, (1024, 1), 'double', True, True), [3298, 3301, 3303, 3303, 3304]), ((1000, (16, 1), 'single', True, True), [5832, 5852, 5851, 5853, 5849]), ((1000, (16, 1), 'double', True, True), [3199, 3202, 3203, 3203, 3202]), ((400, (256, 1), 'single', True, True), [2051, 2073, 2081, 2086, 2096]), ((400, (256, 1), 'double', True, True), [2021, 2035, 2004, 2047, 2051]), ((400, (32, 1), 'single', True, True), [2059, 2082, 2083, 2087, 2081]), ((400, (32, 1), 'double', True, True), [2045, 2040, 2062, 2071, 2081]), ((400, (64, 1), 'single', True, True), [2039, 2068, 2073, 2078, 2074]), ((400, (64, 1), 'double', True, True), [2027, 2057, 2028, 2050, 2054]), ((400, (128, 1), 'single', True, True), [2053, 2098, 2095, 2091, 2075]), ((400, (128, 1), 'double', True, True), [2047, 2072, 2081, 2076, 2088]), ((400, (16, 1), 'single', True, True), [2066, 2099, 2100, 2098, 2099]), ((400, (16, 1), 'double', True, True), [2252, 2272, 2271, 2265, 2302]), ((50, (32, 1), 'single', True, True), [32, 32, 32, 33, 33]), ((50, (32, 1), 'double', True, True), [32, 33, 33, 33, 33]), ((50, (64, 1), 'single', True, True), [32, 32, 33, 33, 33]), ((50, (64, 1), 'double', True, True), [32, 32, 32, 33, 33]), ((50, (128, 1), 'single', True, True), [32, 33, 33, 33, 33]), ((50, (128, 1), 'double', True, True), [32, 32, 32, 32, 33]), ((50, (16, 1), 'single', True, True), [32, 33, 33, 33, 33]), ((50, (16, 1), 'double', True, True), [32, 32, 32, 33, 33]), ((600, (256, 1), 'single', True, True), [4500, 4626, 4605, 4612, 4621]), ((600, (256, 1), 'double', True, True), [3292, 3299, 3299, 3304, 3301]), ((600, (32, 1), 'single', True, True), [4631, 4671, 4693, 4696, 4703]), ((600, (32, 1), 'double', True, True), [3317, 3334, 3334, 3333, 3332]), ((600, (64, 1), 'single', True, True), [4537, 4599, 4598, 4608, 4602]), ((600, (64, 1), 'double', True, True), [3297, 3310, 3315, 3314, 3314]), ((600, (128, 1), 'single', True, True), [4416, 4624, 4635, 4638, 4658]), ((600, (128, 1), 'double', True, True), [3299, 3313, 3318, 3316, 3320]), ((600, (512, 1), 'single', True, True), [4473, 4503, 4548, 4544, 4520]), ((600, (512, 1), 'double', True, True), [3191, 3205, 3205, 3202, 3201]), ((600, (16, 1), 'single', True, True), [4618, 4683, 4657, 4669, 4680]), ((600, (16, 1), 'double', True, True), [3246, 3259, 3262, 3264, 3272])] diff --git a/result/ldc_3d_benchmark_P100.log b/result/ldc_3d_benchmark_P100.log index 0f3cb16..d1d2103 100644 --- a/result/ldc_3d_benchmark_P100.log +++ b/result/ldc_3d_benchmark_P100.log @@ -1,144 +1,300 @@ -(16, (16, 1, 1), 'symbolic.D3Q19', 'single', True): ~60 MLUPS -(16, (16, 1, 1), 'symbolic.D3Q19', 'single', False): ~57 MLUPS -(16, (16, 1, 1), 'symbolic.D3Q19', 'double', True): ~60 MLUPS -(16, (16, 1, 1), 'symbolic.D3Q19', 'double', False): ~57 MLUPS -(16, (16, 1, 1), 'symbolic.D3Q27', 'single', True): ~60 MLUPS -(16, (16, 1, 1), 'symbolic.D3Q27', 'single', False): ~57 MLUPS -(16, (16, 1, 1), 'symbolic.D3Q27', 'double', True): ~60 MLUPS -(16, (16, 1, 1), 'symbolic.D3Q27', 'double', False): ~57 MLUPS -(32, (16, 1, 1), 'symbolic.D3Q19', 'single', True): ~481 MLUPS -(32, (16, 1, 1), 'symbolic.D3Q19', 'single', False): ~462 MLUPS -(32, (16, 1, 1), 'symbolic.D3Q19', 'double', True): ~481 MLUPS -(32, (16, 1, 1), 'symbolic.D3Q19', 'double', False): ~413 MLUPS -(32, (16, 1, 1), 'symbolic.D3Q27', 'single', True): ~480 MLUPS -(32, (16, 1, 1), 'symbolic.D3Q27', 'single', False): ~454 MLUPS -(32, (16, 1, 1), 'symbolic.D3Q27', 'double', True): ~477 MLUPS -(32, (16, 1, 1), 'symbolic.D3Q27', 'double', False): ~266 MLUPS -(32, (32, 1, 1), 'symbolic.D3Q19', 'single', True): ~481 MLUPS -(32, (32, 1, 1), 'symbolic.D3Q19', 'single', False): ~476 MLUPS -(32, (32, 1, 1), 'symbolic.D3Q19', 'double', True): ~477 MLUPS -(32, (32, 1, 1), 'symbolic.D3Q19', 'double', False): ~474 MLUPS -(32, (32, 1, 1), 'symbolic.D3Q27', 'single', True): ~478 MLUPS -(32, (32, 1, 1), 'symbolic.D3Q27', 'single', False): ~482 MLUPS -(32, (32, 1, 1), 'symbolic.D3Q27', 'double', True): ~480 MLUPS -(32, (32, 1, 1), 'symbolic.D3Q27', 'double', False): ~426 MLUPS -(48, (16, 1, 1), 'symbolic.D3Q19', 'single', True): ~1609 MLUPS -(48, (16, 1, 1), 'symbolic.D3Q19', 'single', False): ~1250 MLUPS -(48, (16, 1, 1), 'symbolic.D3Q19', 'double', True): ~1428 MLUPS -(48, (16, 1, 1), 'symbolic.D3Q19', 'double', False): ~510 MLUPS -(48, (16, 1, 1), 'symbolic.D3Q27', 'single', True): ~1600 MLUPS -(48, (16, 1, 1), 'symbolic.D3Q27', 'single', False): ~776 MLUPS -(48, (16, 1, 1), 'symbolic.D3Q27', 'double', True): ~1010 MLUPS -(48, (16, 1, 1), 'symbolic.D3Q27', 'double', False): ~322 MLUPS -(48, (24, 1, 1), 'symbolic.D3Q19', 'single', True): ~1609 MLUPS -(48, (24, 1, 1), 'symbolic.D3Q19', 'single', False): ~1603 MLUPS -(48, (24, 1, 1), 'symbolic.D3Q19', 'double', True): ~1402 MLUPS -(48, (24, 1, 1), 'symbolic.D3Q19', 'double', False): ~718 MLUPS -(48, (24, 1, 1), 'symbolic.D3Q27', 'single', True): ~1634 MLUPS -(48, (24, 1, 1), 'symbolic.D3Q27', 'single', False): ~1030 MLUPS -(48, (24, 1, 1), 'symbolic.D3Q27', 'double', True): ~1006 MLUPS -(48, (24, 1, 1), 'symbolic.D3Q27', 'double', False): ~454 MLUPS -(48, (48, 1, 1), 'symbolic.D3Q19', 'single', True): ~1621 MLUPS -(48, (48, 1, 1), 'symbolic.D3Q19', 'single', False): ~1635 MLUPS -(48, (48, 1, 1), 'symbolic.D3Q19', 'double', True): ~1417 MLUPS -(48, (48, 1, 1), 'symbolic.D3Q19', 'double', False): ~724 MLUPS -(48, (48, 1, 1), 'symbolic.D3Q27', 'single', True): ~1617 MLUPS -(48, (48, 1, 1), 'symbolic.D3Q27', 'single', False): ~1046 MLUPS -(48, (48, 1, 1), 'symbolic.D3Q27', 'double', True): ~1022 MLUPS -(48, (48, 1, 1), 'symbolic.D3Q27', 'double', False): ~464 MLUPS -(64, (16, 1, 1), 'symbolic.D3Q19', 'single', True): ~2668 MLUPS -(64, (16, 1, 1), 'symbolic.D3Q19', 'single', False): ~1327 MLUPS -(64, (16, 1, 1), 'symbolic.D3Q19', 'double', True): ~1558 MLUPS -(64, (16, 1, 1), 'symbolic.D3Q19', 'double', False): ~517 MLUPS -(64, (16, 1, 1), 'symbolic.D3Q27', 'single', True): ~1793 MLUPS -(64, (16, 1, 1), 'symbolic.D3Q27', 'single', False): ~821 MLUPS -(64, (16, 1, 1), 'symbolic.D3Q27', 'double', True): ~1116 MLUPS -(64, (16, 1, 1), 'symbolic.D3Q27', 'double', False): ~327 MLUPS -(64, (32, 1, 1), 'symbolic.D3Q19', 'single', True): ~2817 MLUPS -(64, (32, 1, 1), 'symbolic.D3Q19', 'single', False): ~2295 MLUPS -(64, (32, 1, 1), 'symbolic.D3Q19', 'double', True): ~1560 MLUPS -(64, (32, 1, 1), 'symbolic.D3Q19', 'double', False): ~967 MLUPS -(64, (32, 1, 1), 'symbolic.D3Q27', 'single', True): ~1902 MLUPS -(64, (32, 1, 1), 'symbolic.D3Q27', 'single', False): ~1414 MLUPS -(64, (32, 1, 1), 'symbolic.D3Q27', 'double', True): ~1113 MLUPS -(64, (32, 1, 1), 'symbolic.D3Q27', 'double', False): ~610 MLUPS -(64, (64, 1, 1), 'symbolic.D3Q19', 'single', True): ~2737 MLUPS -(64, (64, 1, 1), 'symbolic.D3Q19', 'single', False): ~2314 MLUPS -(64, (64, 1, 1), 'symbolic.D3Q19', 'double', True): ~1561 MLUPS -(64, (64, 1, 1), 'symbolic.D3Q19', 'double', False): ~970 MLUPS -(64, (64, 1, 1), 'symbolic.D3Q27', 'single', True): ~1883 MLUPS -(64, (64, 1, 1), 'sy