1/* 2 * This file is part of FFmpeg. 3 * 4 * FFmpeg is free software; you can redistribute it and/or 5 * modify it under the terms of the GNU Lesser General Public 6 * License as published by the Free Software Foundation; either 7 * version 2.1 of the License, or (at your option) any later version. 8 * 9 * FFmpeg is distributed in the hope that it will be useful, 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of 11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 12 * Lesser General Public License for more details. 13 * 14 * You should have received a copy of the GNU Lesser General Public 15 * License along with FFmpeg; if not, write to the Free Software 16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 17 */ 18 19#include <stdint.h> 20 21#include "config.h" 22#include "libavutil/attributes.h" 23#include "libavutil/cpu.h" 24#include "libavutil/x86/cpu.h" 25#include "libavcodec/h264chroma.h" 26 27void ff_put_h264_chroma_mc8_rnd_mmx (uint8_t *dst, uint8_t *src, 28 int stride, int h, int x, int y); 29void ff_avg_h264_chroma_mc8_rnd_mmxext(uint8_t *dst, uint8_t *src, 30 int stride, int h, int x, int y); 31void ff_avg_h264_chroma_mc8_rnd_3dnow(uint8_t *dst, uint8_t *src, 32 int stride, int h, int x, int y); 33 34void ff_put_h264_chroma_mc4_mmx (uint8_t *dst, uint8_t *src, 35 int stride, int h, int x, int y); 36void ff_avg_h264_chroma_mc4_mmxext (uint8_t *dst, uint8_t *src, 37 int stride, int h, int x, int y); 38void ff_avg_h264_chroma_mc4_3dnow (uint8_t *dst, uint8_t *src, 39 int stride, int h, int x, int y); 40 41void ff_put_h264_chroma_mc2_mmxext (uint8_t *dst, uint8_t *src, 42 int stride, int h, int x, int y); 43void ff_avg_h264_chroma_mc2_mmxext (uint8_t *dst, uint8_t *src, 44 int stride, int h, int x, int y); 45 46void ff_put_h264_chroma_mc8_rnd_ssse3(uint8_t *dst, uint8_t *src, 47 int stride, int h, int x, int y); 48void ff_put_h264_chroma_mc4_ssse3 (uint8_t *dst, uint8_t *src, 49 int stride, int h, int x, int y); 50 51void ff_avg_h264_chroma_mc8_rnd_ssse3(uint8_t *dst, uint8_t *src, 52 int stride, int h, int x, int y); 53void ff_avg_h264_chroma_mc4_ssse3 (uint8_t *dst, uint8_t *src, 54 int stride, int h, int x, int y); 55 56#define CHROMA_MC(OP, NUM, DEPTH, OPT) \ 57void ff_ ## OP ## _h264_chroma_mc ## NUM ## _ ## DEPTH ## _ ## OPT \ 58 (uint8_t *dst, uint8_t *src, \ 59 int stride, int h, int x, int y); 60 61CHROMA_MC(put, 2, 10, mmxext) 62CHROMA_MC(avg, 2, 10, mmxext) 63CHROMA_MC(put, 4, 10, mmxext) 64CHROMA_MC(avg, 4, 10, mmxext) 65CHROMA_MC(put, 8, 10, sse2) 66CHROMA_MC(avg, 8, 10, sse2) 67CHROMA_MC(put, 8, 10, avx) 68CHROMA_MC(avg, 8, 10, avx) 69 70av_cold void ff_h264chroma_init_x86(H264ChromaContext *c, int bit_depth) 71{ 72 int high_bit_depth = bit_depth > 8; 73 int cpu_flags = av_get_cpu_flags(); 74 75 if (EXTERNAL_MMX(cpu_flags) && !high_bit_depth) { 76 c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_rnd_mmx; 77 c->put_h264_chroma_pixels_tab[1] = ff_put_h264_chroma_mc4_mmx; 78 } 79 80 if (EXTERNAL_AMD3DNOW(cpu_flags) && !high_bit_depth) { 81 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_rnd_3dnow; 82 c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_3dnow; 83 } 84 85 if (EXTERNAL_MMXEXT(cpu_flags) && !high_bit_depth) { 86 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_rnd_mmxext; 87 c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_mmxext; 88 c->avg_h264_chroma_pixels_tab[2] = ff_avg_h264_chroma_mc2_mmxext; 89 c->put_h264_chroma_pixels_tab[2] = ff_put_h264_chroma_mc2_mmxext; 90 } 91 92 if (EXTERNAL_MMXEXT(cpu_flags) && bit_depth > 8 && bit_depth <= 10) { 93 c->put_h264_chroma_pixels_tab[2] = ff_put_h264_chroma_mc2_10_mmxext; 94 c->avg_h264_chroma_pixels_tab[2] = ff_avg_h264_chroma_mc2_10_mmxext; 95 c->put_h264_chroma_pixels_tab[1] = ff_put_h264_chroma_mc4_10_mmxext; 96 c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_10_mmxext; 97 } 98 99 if (EXTERNAL_SSE2(cpu_flags) && bit_depth > 8 && bit_depth <= 10) { 100 c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_10_sse2; 101 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_10_sse2; 102 } 103 104 if (EXTERNAL_SSSE3(cpu_flags) && !high_bit_depth) { 105 c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_rnd_ssse3; 106 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_rnd_ssse3; 107 c->put_h264_chroma_pixels_tab[1] = ff_put_h264_chroma_mc4_ssse3; 108 c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_ssse3; 109 } 110 111 if (EXTERNAL_AVX(cpu_flags) && bit_depth > 8 && bit_depth <= 10) { 112 // AVX implies !cache64. 113 // TODO: Port cache(32|64) detection from x264. 114 c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_10_avx; 115 c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_10_avx; 116 } 117} 118