diff options
author | Nick Kurshev <nickols_k@mail.ru> | 2002-01-20 14:48:02 +0000 |
---|---|---|
committer | Nick Kurshev <nickols_k@mail.ru> | 2002-01-20 14:48:02 +0000 |
commit | 1e98dffb7aa4b4681ecc7949e7ad58acc80ad86a (patch) | |
tree | eda5315707572d48e2f75e55cd210254068fea18 /libavcodec/alpha/pixops.h | |
parent | 4bdd9157cc0b06c7001cb93e5cdd6304306253c4 (diff) | |
download | ffmpeg-1e98dffb7aa4b4681ecc7949e7ad58acc80ad86a.tar.gz |
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
Originally committed as revision 274 to svn://svn.ffmpeg.org/ffmpeg/trunk
Diffstat (limited to 'libavcodec/alpha/pixops.h')
-rw-r--r-- | libavcodec/alpha/pixops.h | 135 |
1 files changed, 135 insertions, 0 deletions
diff --git a/libavcodec/alpha/pixops.h b/libavcodec/alpha/pixops.h new file mode 100644 index 0000000000..7ae72ed779 --- /dev/null +++ b/libavcodec/alpha/pixops.h @@ -0,0 +1,135 @@ +/* + * Alpha optimized DSP utils + * Copyright (c) 2002 Falk Hueffner <falk@debian.org> + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. + */ + +/* This file is intended to be #included with proper definitions of + * PIXOPNAME, BTYPE, AVG2, AVG4 and STORE. 
*/
+/*
+ * PIXOPNAME(_pixels_axp): for each of h rows, load one 64-bit word from
+ * pixels and hand it to STORE together with block, then advance pixels
+ * and block by line_size (each in units of its own pointee type).
+ *
+ *   block     - passed as the second argument of STORE
+ *   pixels    - source bytes
+ *   line_size - added to both pointers after every row
+ *   h         - row count; the do/while body runs before h is first
+ *               tested, so h must be at least 1
+ *
+ * STORE is expected to be defined by the including file.  uldq and ldq
+ * are not defined in this file; presumably they are the unaligned and
+ * aligned 64-bit loads -- confirm.  The address test is done once, before
+ * the loop.  NOTE(review): the ldq branch stays selected for every row,
+ * so it looks like line_size is expected to be a multiple of 8 -- verify
+ * against callers.
+ */
+static void PIXOPNAME(_pixels_axp)(BTYPE *block, const UINT8 *pixels,
+                                   int line_size, int h)
+{
+    if ((size_t) pixels & 0x7) {        /* low three address bits set */
+        do {
+            STORE(uldq(pixels), block);
+            pixels += line_size;
+            block += line_size;
+        } while (--h);
+    } else {                            /* pixels is a multiple of 8 */
+        do {
+            STORE(ldq(pixels), block);
+            pixels += line_size;
+            block += line_size;
+        } while (--h);
+    }
+}
+/*
+ * PIXOPNAME(_pixels_x2_axp): for each of h rows, combine the 64-bit word
+ * loaded from pixels with a copy of it moved down by one byte, using
+ * AVG2, and pass the result to STORE.
+ *
+ * The second operand is (pix1 >> 8) with pixels[8] placed in bits 56..63,
+ * so every row also reads the byte at pixels[8].  Assuming the loads are
+ * little-endian 8-byte loads, that operand equals the word starting at
+ * pixels + 1 -- confirm for the target.
+ *
+ *   block     - passed as the second argument of STORE
+ *   pixels    - source bytes
+ *   line_size - added to both pointers after every row
+ *   h         - row count; must be at least 1 (do/while loop)
+ *
+ * AVG2 and STORE are expected to be defined by the including file.  The
+ * uldq/ldq choice is made once from the initial value of pixels.
+ */
+static void PIXOPNAME(_pixels_x2_axp)(BTYPE *block, const UINT8 *pixels,
+                                      int line_size, int h)
+{
+    if ((size_t) pixels & 0x7) {        /* low three address bits set */
+        do {
+            UINT64 pix1, pix2;
+            /* pix2: pix1 moved down one byte, pixels[8] in the top byte */
+            pix1 = uldq(pixels);
+            pix2 = pix1 >> 8 | ((UINT64) pixels[8] << 56);
+            STORE(AVG2(pix1, pix2), block);
+            pixels += line_size;
+            block += line_size;
+        } while (--h);
+    } else {                            /* pixels is a multiple of 8 */
+        do {
+            UINT64 pix1, pix2;
+            /* pix2: pix1 moved down one byte, pixels[8] in the top byte */
+            pix1 = ldq(pixels);
+            pix2 = pix1 >> 8 | ((UINT64) pixels[8] << 56);
+            STORE(AVG2(pix1, pix2), block);
+            pixels += line_size;
+            block += line_size;
+        } while (--h);
+    }
+}
+/*
+ * PIXOPNAME(_pixels_y2_axp): for each of h rows, combine the 64-bit word
+ * of the current source row with the word of the row line_size bytes
+ * further on, using AVG2, and pass the result to STORE.
+ *
+ * The first row is loaded before the loop and every pass loads one more,
+ * so h + 1 source rows are read in total.  The word loaded in one pass is
+ * kept and reused as the first operand of the next pass.
+ *
+ *   block     - passed as the second argument of STORE
+ *   pixels    - source bytes
+ *   line_size - added to pixels before each load and to block after
+ *               each STORE
+ *   h         - row count; must be at least 1 (do/while loop)
+ *
+ * AVG2 and STORE are expected to be defined by the including file.  The
+ * uldq/ldq choice is made once from the initial value of pixels.
+ */
+static void PIXOPNAME(_pixels_y2_axp)(BTYPE *block, const UINT8 *pixels,
+                                      int line_size, int h)
+{
+    if ((size_t) pixels & 0x7) {        /* low three address bits set */
+        UINT64 pix = uldq(pixels);      /* first row, loaded up front */
+        do {
+            UINT64 next_pix;
+            /* step to the following row and load it */
+            pixels += line_size;
+            next_pix = uldq(pixels);
+            STORE(AVG2(pix, next_pix), block);
+            block += line_size;
+            pix = next_pix;             /* becomes the upper row next pass */
+        } while (--h);
+    } else {                            /* pixels is a multiple of 8 */
+        UINT64 pix = ldq(pixels);       /* first row, loaded up front */
+        do {
+            UINT64 next_pix;
+            /* step to the following row and load it */
+            pixels += line_size;
+            next_pix = ldq(pixels);
+            STORE(AVG2(pix, next_pix), block);
+            block += line_size;
+            pix = next_pix;             /* becomes the upper row next pass */
+        } while (--h);
+    }
+}
+
+/* This could be further sped up by recycling AVG4 intermediate
+   results from the previous loop pass. 
*/ /*
+ * PIXOPNAME(_pixels_xy2_axp): for each of h rows, pass four 64-bit words
+ * to AVG4 and hand the result to STORE: the current source row, the
+ * current row moved down by one byte, the following row, and the
+ * following row moved down by one byte.
+ *
+ * Each moved-down word is (word >> 8) with that row's pixels[8] placed in
+ * bits 56..63, so every row also reads the byte at pixels[8].  Assuming
+ * the loads are little-endian 8-byte loads, this equals the word starting
+ * one byte later -- confirm for the target.  The first row is loaded
+ * before the loop and every pass loads one more, so h + 1 source rows
+ * are read in total.
+ *
+ *   block     - passed as the second argument of STORE
+ *   pixels    - source bytes
+ *   line_size - added to pixels before each load and to block after
+ *               each STORE
+ *   h         - row count; must be at least 1 (do/while loop)
+ *
+ * AVG4 and STORE are expected to be defined by the including file.  uldq
+ * and ldq are not defined in this file (presumably unaligned and aligned
+ * 64-bit loads -- confirm); the choice between them is made once from
+ * the initial value of pixels.
+ */
+static void PIXOPNAME(_pixels_xy2_axp)(BTYPE *block, const UINT8 *pixels,
+                                       int line_size, int h)
+{
+    if ((size_t) pixels & 0x7) {        /* low three address bits set */
+        UINT64 pix1 = uldq(pixels);
+        UINT64 pix2 = pix1 >> 8 | ((UINT64) pixels[8] << 56);
+        /* pix1/pix2 now hold the first row and its one-byte-down copy */
+        do {
+            UINT64 next_pix1, next_pix2;
+            /* load the following row and build its one-byte-down copy */
+            pixels += line_size;
+            next_pix1 = uldq(pixels);
+            next_pix2 = next_pix1 >> 8 | ((UINT64) pixels[8] << 56);
+
+            STORE(AVG4(pix1, pix2, next_pix1, next_pix2), block);
+            /* the row just loaded is the upper row of the next pass */
+            block += line_size;
+            pix1 = next_pix1;
+            pix2 = next_pix2;
+        } while (--h);
+    } else {                            /* pixels is a multiple of 8 */
+        UINT64 pix1 = ldq(pixels);
+        UINT64 pix2 = pix1 >> 8 | ((UINT64) pixels[8] << 56);
+        /* pix1/pix2 now hold the first row and its one-byte-down copy */
+        do {
+            UINT64 next_pix1, next_pix2;
+            /* load the following row and build its one-byte-down copy */
+            pixels += line_size;
+            next_pix1 = ldq(pixels);
+            next_pix2 = next_pix1 >> 8 | ((UINT64) pixels[8] << 56);
+
+            STORE(AVG4(pix1, pix2, next_pix1, next_pix2), block);
+            /* the row just loaded is the upper row of the next pass */
+            block += line_size;
+            pix1 = next_pix1;
+            pix2 = next_pix2;
+        } while (--h);
+    }
+} |