NE10/FFT/complex-non-power-of-2 NEON v1.2.0
author: Phil.Wang <phil.wang@arm.com>
Wed, 17 Dec 2014 03:52:11 +0000 (11:52 +0800)
committer: Phil.Wang <phil.wang@arm.com>
Thu, 18 Dec 2014 08:13:52 +0000 (16:13 +0800)
commit: 20b1896fd6532336e6a46608778bd6e0396dc4dc
tree: 541f4cd17b066b2fd845c9f9b3468134fbc98598
parent: 46b1da15cd3b7851dca5868b288d0fce323c3a58
NE10/FFT/complex-non-power-of-2 NEON

    ARM 64-bit (Cortex-A57)
    complex forward float LLVM 3.5
             Time in ms      |
        |kiss|opus|pffft|NE10|
        |   C|   C| NEON|NEON|
      60| 129| 113|   NA|  44|
     120| 148| 127|   NA|  49|
     240| 151| 128|   55|  47|
     480| 169| 142|   60|  55|
     960| 183| 149|   65|  58|
    1920| 193| 167|   71|  66|
    3840| 217| 175|   76|  71|
    SNR > 100dB

    ARM 64-bit (Cortex-A53)
    complex forward float LLVM 3.5
             Time in ms      |
        |kiss|opus|pffft|NE10|
        |   C|   C| NEON|NEON|
      60| 295| 311|   NA|  72|
     120| 368| 375|   NA|  79|
     240| 345| 342|  104|  77|
     480| 415| 407|  115|  87|
     960| 406| 378|  121|  95|
    1920| 476| 441|  138| 113|
    3840| 497| 424|  161| 126|
    SNR > 100dB

    ARM 32-bit (Cortex-A9)
    complex forward float LLVM 3.5
             Time in ms      |
        |kiss|opus|pffft|NE10|
        |   C|   C| NEON|NEON|
      60| 224| 211|   NA|  98|
     120| 265| 245|   NA| 104|
     240| 262| 240|  130| 106|
     480| 302| 274|  150| 122|
     960| 305| 271|  162| 153|
    1920| 369| 356|  230| 206|
    3840| 415| 440|  282| 239|
    SNR > 100dB

Change-Id: If9418041b01eed49dbdc8d6a18dd03f2c5684da8
21 files changed:
CMakeLists.txt
inc/NE10_dsp.h
inc/NE10_types.h
modules/CMakeLists.txt
modules/dsp/NE10_fft.c
modules/dsp/NE10_fft.h
modules/dsp/NE10_fft.neonintrinsic.h
modules/dsp/NE10_fft_cplx_ops.h
modules/dsp/NE10_fft_float32.c
modules/dsp/NE10_fft_float32.neon.c
modules/dsp/NE10_fft_float32.neonintrinsic.c
modules/dsp/NE10_fft_generic_float32.c
modules/dsp/NE10_fft_generic_float32.h [new file with mode: 0644]
modules/dsp/NE10_fft_generic_float32.neonintrinsic.cpp [new file with mode: 0644]
modules/dsp/NE10_fft_int16.c
modules/dsp/NE10_fft_int32.c
modules/dsp/NE10_fft_int32.neon.c
modules/dsp/NE10_fft_int32.neonintrinsic.c
modules/dsp/NE10_init_dsp.c
modules/dsp/NE10_rfft_float32.c
modules/dsp/test/test_suite_fft_float32.c