annotate ffmpeg/libavcodec/x86/h264chroma_init.c @ 13:844d341cf643 tip

Back up before ISMIR
author Yading Song <yading.song@eecs.qmul.ac.uk>
date Thu, 31 Oct 2013 13:17:06 +0000
parents 6840f77b83aa
children
rev   line source
yading@10 1 /*
yading@10 2 * This file is part of FFmpeg.
yading@10 3 *
yading@10 4 * FFmpeg is free software; you can redistribute it and/or
yading@10 5 * modify it under the terms of the GNU Lesser General Public
yading@10 6 * License as published by the Free Software Foundation; either
yading@10 7 * version 2.1 of the License, or (at your option) any later version.
yading@10 8 *
yading@10 9 * FFmpeg is distributed in the hope that it will be useful,
yading@10 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
yading@10 11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
yading@10 12 * Lesser General Public License for more details.
yading@10 13 *
yading@10 14 * You should have received a copy of the GNU Lesser General Public
yading@10 15 * License along with FFmpeg; if not, write to the Free Software
yading@10 16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
yading@10 17 */
yading@10 18
yading@10 19 #include <stdint.h>
yading@10 20
yading@10 21 #include "config.h"
yading@10 22 #include "libavutil/cpu.h"
yading@10 23 #include "libavutil/x86/cpu.h"
yading@10 24 #include "libavcodec/h264chroma.h"
yading@10 25
/*
 * Prototypes for the chroma routines that ff_h264chroma_init_x86() installs
 * when bit_depth is 8 or lower. Their bodies are not in this file
 * (presumably external assembly, since every use is guarded by HAVE_YASM --
 * confirm).
 *
 * The mcN part of each name matches the table slot the routine is stored in:
 * mc8 -> [0], mc4 -> [1], mc2 -> [2]. The trailing suffix matches the
 * EXTERNAL_*() CPU check that guards its installation.
 *
 * NOTE(review): the exact meaning of dst/src/stride/h/x/y is not visible
 * here; presumably x and y are the sub-pixel offsets -- verify against the
 * implementations.
 */
yading@10 26 void ff_put_h264_chroma_mc8_rnd_mmx (uint8_t *dst, uint8_t *src,
yading@10 27 int stride, int h, int x, int y);
yading@10 28 void ff_avg_h264_chroma_mc8_rnd_mmxext(uint8_t *dst, uint8_t *src,
yading@10 29 int stride, int h, int x, int y);
yading@10 30 void ff_avg_h264_chroma_mc8_rnd_3dnow(uint8_t *dst, uint8_t *src,
yading@10 31 int stride, int h, int x, int y);
yading@10 32
yading@10 33 void ff_put_h264_chroma_mc4_mmx (uint8_t *dst, uint8_t *src,
yading@10 34 int stride, int h, int x, int y);
yading@10 35 void ff_avg_h264_chroma_mc4_mmxext (uint8_t *dst, uint8_t *src,
yading@10 36 int stride, int h, int x, int y);
yading@10 37 void ff_avg_h264_chroma_mc4_3dnow (uint8_t *dst, uint8_t *src,
yading@10 38 int stride, int h, int x, int y);
yading@10 39
yading@10 40 void ff_put_h264_chroma_mc2_mmxext (uint8_t *dst, uint8_t *src,
yading@10 41 int stride, int h, int x, int y);
yading@10 42 void ff_avg_h264_chroma_mc2_mmxext (uint8_t *dst, uint8_t *src,
yading@10 43 int stride, int h, int x, int y);
yading@10 44
yading@10 45 void ff_put_h264_chroma_mc8_rnd_ssse3(uint8_t *dst, uint8_t *src,
yading@10 46 int stride, int h, int x, int y);
yading@10 47 void ff_put_h264_chroma_mc4_ssse3 (uint8_t *dst, uint8_t *src,
yading@10 48 int stride, int h, int x, int y);
yading@10 49
yading@10 50 void ff_avg_h264_chroma_mc8_rnd_ssse3(uint8_t *dst, uint8_t *src,
yading@10 51 int stride, int h, int x, int y);
yading@10 52 void ff_avg_h264_chroma_mc4_ssse3 (uint8_t *dst, uint8_t *src,
yading@10 53 int stride, int h, int x, int y);
yading@10 54
/*
 * Declare the prototype ff_<OP>_h264_chroma_mc<NUM>_<DEPTH>_<OPT>, taking
 * (uint8_t *dst, uint8_t *src, int stride, int h, int x, int y).
 * The expansion already ends in ';', so each use below is written without a
 * trailing semicolon.
 */
yading@10 55 #define CHROMA_MC(OP, NUM, DEPTH, OPT) \
yading@10 56 void ff_ ## OP ## _h264_chroma_mc ## NUM ## _ ## DEPTH ## _ ## OPT \
yading@10 57 (uint8_t *dst, uint8_t *src, \
yading@10 58 int stride, int h, int x, int y);
yading@10 59
/*
 * DEPTH is 10 for every instantiation. ff_h264chroma_init_x86() installs
 * these only when 8 < bit_depth <= 10.
 */
yading@10 60 CHROMA_MC(put, 2, 10, mmxext)
yading@10 61 CHROMA_MC(avg, 2, 10, mmxext)
yading@10 62 CHROMA_MC(put, 4, 10, mmxext)
yading@10 63 CHROMA_MC(avg, 4, 10, mmxext)
yading@10 64 CHROMA_MC(put, 8, 10, sse2)
yading@10 65 CHROMA_MC(avg, 8, 10, sse2)
yading@10 66 CHROMA_MC(put, 8, 10, avx)
yading@10 67 CHROMA_MC(avg, 8, 10, avx)
yading@10 68
/*
 * Fill the put/avg chroma function tables of an H264ChromaContext with x86
 * implementations.
 *
 * c         context whose put_h264_chroma_pixels_tab[] and
 *           avg_h264_chroma_pixels_tab[] entries are overwritten.
 * bit_depth sample bit depth; selects the 8-bit set (bit_depth <= 8) or the
 *           10-bit set (8 < bit_depth <= 10). For bit_depth > 10 no entry is
 *           touched.
 *
 * The whole body is compiled only when HAVE_YASM is set; otherwise the
 * function does nothing. Table slots: [0] = mc8, [1] = mc4, [2] = mc2.
 *
 * The feature checks run in a fixed order and later ones overwrite slots set
 * by earlier ones, so the order of the if-blocks is significant.
 */
yading@10 69 void ff_h264chroma_init_x86(H264ChromaContext *c, int bit_depth)
yading@10 70 {
yading@10 71 #if HAVE_YASM
yading@10 72 int high_bit_depth = bit_depth > 8;
yading@10 73 int mm_flags = av_get_cpu_flags();
yading@10 74
/* 8-bit: MMX supplies put for mc8 and mc4. */
yading@10 75 if (EXTERNAL_MMX(mm_flags) && !high_bit_depth) {
yading@10 76 c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_rnd_mmx;
yading@10 77 c->put_h264_chroma_pixels_tab[1] = ff_put_h264_chroma_mc4_mmx;
yading@10 78 }
yading@10 79
/* 8-bit: 3DNow! avg for mc8/mc4; replaced below if MMXEXT is also present. */
yading@10 80 if (EXTERNAL_AMD3DNOW(mm_flags) && !high_bit_depth) {
yading@10 81 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_rnd_3dnow;
yading@10 82 c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_3dnow;
yading@10 83 }
yading@10 84
/* 8-bit: MMXEXT avg for all three sizes, plus the only put for mc2. */
yading@10 85 if (EXTERNAL_MMXEXT(mm_flags) && !high_bit_depth) {
yading@10 86 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_rnd_mmxext;
yading@10 87 c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_mmxext;
yading@10 88 c->avg_h264_chroma_pixels_tab[2] = ff_avg_h264_chroma_mc2_mmxext;
yading@10 89 c->put_h264_chroma_pixels_tab[2] = ff_put_h264_chroma_mc2_mmxext;
yading@10 90 }
yading@10 91
/* 9/10-bit: MMXEXT covers mc2 and mc4; slot [0] is left to SSE2/AVX below. */
yading@10 92 if (EXTERNAL_MMXEXT(mm_flags) && bit_depth > 8 && bit_depth <= 10) {
yading@10 93 c->put_h264_chroma_pixels_tab[2] = ff_put_h264_chroma_mc2_10_mmxext;
yading@10 94 c->avg_h264_chroma_pixels_tab[2] = ff_avg_h264_chroma_mc2_10_mmxext;
yading@10 95 c->put_h264_chroma_pixels_tab[1] = ff_put_h264_chroma_mc4_10_mmxext;
yading@10 96 c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_10_mmxext;
yading@10 97 }
yading@10 98
/* 9/10-bit: SSE2 mc8; replaced by the AVX versions if AVX is available. */
yading@10 99 if (EXTERNAL_SSE2(mm_flags) && bit_depth > 8 && bit_depth <= 10) {
yading@10 100 c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_10_sse2;
yading@10 101 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_10_sse2;
yading@10 102 }
yading@10 103
/* 8-bit: SSSE3 overrides the MMX/3DNow!/MMXEXT mc8 and mc4 entries. */
yading@10 104 if (EXTERNAL_SSSE3(mm_flags) && !high_bit_depth) {
yading@10 105 c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_rnd_ssse3;
yading@10 106 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_rnd_ssse3;
yading@10 107 c->put_h264_chroma_pixels_tab[1] = ff_put_h264_chroma_mc4_ssse3;
yading@10 108 c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_ssse3;
yading@10 109 }
yading@10 110
/* 9/10-bit: AVX mc8, checked last so it wins over the SSE2 entries. */
yading@10 111 if (EXTERNAL_AVX(mm_flags) && bit_depth > 8 && bit_depth <= 10) {
yading@10 112 // AVX implies !cache64.
yading@10 113 // TODO: Port cache(32|64) detection from x264.
yading@10 114 c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_10_avx;
yading@10 115 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_10_avx;
yading@10 116 }
yading@10 117 #endif
yading@10 118 }