[981e22c] | 1 | /********************************************************************* |
---|
| 2 | Blosc - Blocked Shuffling and Compression Library |
---|
| 3 | |
---|
| 4 | Author: Francesc Alted <[email protected]> |
---|
| 5 | |
---|
| 6 | See LICENSES/BLOSC.txt for details about copyright and rights to use. |
---|
| 7 | **********************************************************************/ |
---|
| 8 | |
---|
| 9 | /* Generic (non-hardware-accelerated) shuffle/unshuffle routines. |
---|
| 10 | These are used when hardware-accelerated functions aren't available |
---|
| 11 | for a particular platform; they are also used by the hardware- |
---|
| 12 | accelerated functions to handle any remaining elements in a block |
---|
| 13 | which isn't a multiple of the hardware's vector size. */ |
---|
| 14 | |
---|
| 15 | #ifndef SHUFFLE_GENERIC_H |
---|
| 16 | #define SHUFFLE_GENERIC_H |
---|
| 17 | |
---|
#include "shuffle-common.h"
#include <stdlib.h>
#include <string.h>
---|
| 20 | |
---|
| 21 | #ifdef __cplusplus |
---|
| 22 | extern "C" { |
---|
| 23 | #endif |
---|
| 24 | |
---|
/**
  Generic (non-hardware-accelerated) shuffle routine.
  This is the pure element-copying nested loop. It is used by the
  generic shuffle implementation and also by the vectorized shuffle
  implementations to process any remaining elements in a block which
  is not a multiple of (type_size * vector_size).

  The block is treated as (blocksize / type_size) whole elements of
  type_size bytes each. Byte j of element i is written to
  _dest[j * (blocksize / type_size) + i]. Only elements with index
  >= (vectorizable_blocksize / type_size) are processed here; earlier
  elements are left untouched in _dest. The trailing
  (blocksize % type_size) bytes are copied verbatim.

  type_size               size in bytes of one element
  vectorizable_blocksize  leading byte count that this routine skips
  blocksize               total size of the block in bytes
  _src                    input buffer, at least blocksize bytes
  _dest                   output buffer, at least blocksize bytes;
                          it is passed to memcpy together with _src, so
                          the two must not overlap

  If type_size is 0 the routine returns without touching _dest, since
  the element count cannot be computed.
*/
static void shuffle_generic_inline(const size_t type_size,
    const size_t vectorizable_blocksize, const size_t blocksize,
    const uint8_t* const _src, uint8_t* const _dest)
{
  size_t i, j;
  size_t neblock_quot, neblock_rem, vectorizable_elements;

  /* Dividing by a zero element size is undefined behavior. */
  if (type_size == 0) {
    return;
  }

  /* Calculate the number of elements in the block. */
  neblock_quot = blocksize / type_size;
  neblock_rem = blocksize % type_size;
  vectorizable_elements = vectorizable_blocksize / type_size;

  /* Non-optimized shuffle: gather byte j of every remaining element
     into the j-th byte plane of the destination. */
  for (j = 0; j < type_size; j++) {
    for (i = vectorizable_elements; i < neblock_quot; i++) {
      _dest[j*neblock_quot+i] = _src[i*type_size+j];
    }
  }

  /* Copy any leftover bytes in the block without shuffling them.
     Skipped when there are none so memcpy is never handed pointers
     that the caller may have left null for an empty block. */
  if (neblock_rem > 0) {
    memcpy(_dest + (blocksize - neblock_rem),
           _src + (blocksize - neblock_rem), neblock_rem);
  }
}
---|
| 53 | |
---|
/**
  Generic (non-hardware-accelerated) unshuffle routine.
  This is the pure element-copying nested loop. It is used by the
  generic unshuffle implementation and also by the vectorized unshuffle
  implementations to process any remaining elements in a block which
  is not a multiple of (type_size * vector_size).

  This is the inverse of the generic shuffle loop: byte j of element i
  is read from _src[j * (blocksize / type_size) + i] and written to
  _dest[i * type_size + j]. Only elements with index
  >= (vectorizable_blocksize / type_size) are processed here; earlier
  elements are left untouched in _dest. The trailing
  (blocksize % type_size) bytes are copied verbatim.

  type_size               size in bytes of one element
  vectorizable_blocksize  leading byte count that this routine skips
  blocksize               total size of the block in bytes
  _src                    shuffled input buffer, at least blocksize bytes
  _dest                   output buffer, at least blocksize bytes;
                          it is passed to memcpy together with _src, so
                          the two must not overlap

  If type_size is 0 the routine returns without touching _dest, since
  the element count cannot be computed.
*/
static void unshuffle_generic_inline(const size_t type_size,
    const size_t vectorizable_blocksize, const size_t blocksize,
    const uint8_t* const _src, uint8_t* const _dest)
{
  size_t i, j;
  size_t neblock_quot, neblock_rem, vectorizable_elements;

  /* Dividing by a zero element size is undefined behavior. */
  if (type_size == 0) {
    return;
  }

  /* Calculate the number of elements in the block. */
  neblock_quot = blocksize / type_size;
  neblock_rem = blocksize % type_size;
  vectorizable_elements = vectorizable_blocksize / type_size;

  /* Non-optimized unshuffle: rebuild each remaining element from its
     bytes, one per byte plane of the source. */
  for (i = vectorizable_elements; i < neblock_quot; i++) {
    for (j = 0; j < type_size; j++) {
      _dest[i*type_size+j] = _src[j*neblock_quot+i];
    }
  }

  /* Copy any leftover bytes in the block without unshuffling them.
     Skipped when there are none so memcpy is never handed pointers
     that the caller may have left null for an empty block. */
  if (neblock_rem > 0) {
    memcpy(_dest + (blocksize - neblock_rem),
           _src + (blocksize - neblock_rem), neblock_rem);
  }
}
---|
| 82 | |
---|
| 83 | /** |
---|
| 84 | Generic (non-hardware-accelerated) shuffle routine. Declared here only; the definition is not in this header. It takes a read-only source buffer (_src) and a writable destination buffer (_dest). bytesoftype and blocksize are presumably the element size and the block size in bytes (inferred from the names; confirm against the definition). |
---|
| 85 | */ |
---|
| 86 | BLOSC_NO_EXPORT void shuffle_generic(const size_t bytesoftype, const size_t blocksize, |
---|
| 87 | const uint8_t* const _src, uint8_t* const _dest); |
---|
| 88 | |
---|
| 89 | /** |
---|
| 90 | Generic (non-hardware-accelerated) unshuffle routine. Declared here only; the definition is not in this header. It takes a read-only source buffer (_src) and a writable destination buffer (_dest). bytesoftype and blocksize are presumably the element size and the block size in bytes (inferred from the names; confirm against the definition). |
---|
| 91 | */ |
---|
| 92 | BLOSC_NO_EXPORT void unshuffle_generic(const size_t bytesoftype, const size_t blocksize, |
---|
| 93 | const uint8_t* const _src, uint8_t* const _dest); |
---|
| 94 | |
---|
| 95 | #ifdef __cplusplus |
---|
| 96 | } |
---|
| 97 | #endif |
---|
| 98 | |
---|
| 99 | #endif /* SHUFFLE_GENERIC_H */ |
---|