/*
 * This file is part of Libav.
 *
 * Libav is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * Libav is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with Libav; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include <stdint.h>

#include "libavutil/attributes.h"
#include "libavutil/cpu.h"
#include "libavutil/x86/cpu.h"
#include "libavcodec/h264chroma.h"

/*
 * mc8 chroma routines, declared here and defined outside this file
 * (presumably in x86 assembly -- confirm against the build).
 * ff_h264chroma_init_x86() installs them in slot 0 of the put/avg tables,
 * and only when bit_depth <= 8.
 */
void ff_put_h264_chroma_mc8_rnd_mmx   (uint8_t *dst, uint8_t *src,
                                       int stride, int h, int x, int y);
void ff_avg_h264_chroma_mc8_rnd_mmxext(uint8_t *dst, uint8_t *src,
                                       int stride, int h, int x, int y);
void ff_avg_h264_chroma_mc8_rnd_3dnow (uint8_t *dst, uint8_t *src,
                                       int stride, int h, int x, int y);

/*
 * mc4 chroma routines, declared here and defined outside this file
 * (presumably in x86 assembly -- confirm against the build).
 * ff_h264chroma_init_x86() installs them in slot 1 of the put/avg tables,
 * and only when bit_depth <= 8.
 */
void ff_put_h264_chroma_mc4_mmx   (uint8_t *dst, uint8_t *src,
                                   int stride, int h, int x, int y);
void ff_avg_h264_chroma_mc4_mmxext(uint8_t *dst, uint8_t *src,
                                   int stride, int h, int x, int y);
void ff_avg_h264_chroma_mc4_3dnow (uint8_t *dst, uint8_t *src,
                                   int stride, int h, int x, int y);

/*
 * mc2 chroma routines (MMXEXT), declared here and defined outside this file
 * (presumably in x86 assembly -- confirm against the build).
 * ff_h264chroma_init_x86() installs them in slot 2 of the put/avg tables,
 * and only when bit_depth <= 8.
 */
void ff_put_h264_chroma_mc2_mmxext(uint8_t *dst, uint8_t *src,
                                   int stride, int h, int x, int y);
void ff_avg_h264_chroma_mc2_mmxext(uint8_t *dst, uint8_t *src,
                                   int stride, int h, int x, int y);

/*
 * SSSE3 "put" chroma routines, declared here and defined outside this file
 * (presumably in x86 assembly -- confirm against the build).
 * ff_h264chroma_init_x86() installs them in put slots 0 (mc8) and 1 (mc4),
 * and only when bit_depth <= 8.
 */
void ff_put_h264_chroma_mc8_rnd_ssse3(uint8_t *dst, uint8_t *src,
                                      int stride, int h, int x, int y);
void ff_put_h264_chroma_mc4_ssse3    (uint8_t *dst, uint8_t *src,
                                      int stride, int h, int x, int y);

/*
 * SSSE3 "avg" chroma routines, declared here and defined outside this file
 * (presumably in x86 assembly -- confirm against the build).
 * ff_h264chroma_init_x86() installs them in avg slots 0 (mc8) and 1 (mc4),
 * and only when bit_depth <= 8.
 */
void ff_avg_h264_chroma_mc8_rnd_ssse3(uint8_t *dst, uint8_t *src,
                                      int stride, int h, int x, int y);
void ff_avg_h264_chroma_mc4_ssse3    (uint8_t *dst, uint8_t *src,
                                      int stride, int h, int x, int y);

/*
 * Declare one depth-specific chroma routine named
 *     ff_<OP>_h264_chroma_mc<NUM>_<DEPTH>_<OPT>
 * with the same parameter list as the hand-written prototypes in this file.
 * The expansion already ends in ';', so invocations carry no semicolon.
 */
#define CHROMA_MC(OP, NUM, DEPTH, OPT)                                  \
void ff_ ## OP ## _h264_chroma_mc ## NUM ## _ ## DEPTH ## _ ## OPT      \
                                      (uint8_t *dst, uint8_t *src,      \
                                       int stride, int h, int x, int y);

/* Routines installed by ff_h264chroma_init_x86() for 8 < bit_depth <= 10. */
CHROMA_MC(put, 2, 10, mmxext)
CHROMA_MC(avg, 2, 10, mmxext)
CHROMA_MC(put, 4, 10, mmxext)
CHROMA_MC(avg, 4, 10, mmxext)
CHROMA_MC(put, 8, 10, sse2)
CHROMA_MC(avg, 8, 10, sse2)
CHROMA_MC(put, 8, 10, avx)
CHROMA_MC(avg, 8, 10, avx)

/**
 * Fill the put/avg chroma function tables of @p c with x86 SIMD routines.
 *
 * Table slot 0 receives mc8 routines, slot 1 mc4 routines and slot 2 mc2
 * routines. The checks run from the oldest instruction set to the newest,
 * so a later match overwrites a slot filled by an earlier one. Slots for
 * which no check matches are left untouched.
 *
 * @param c         context whose put_h264_chroma_pixels_tab and
 *                  avg_h264_chroma_pixels_tab entries are overwritten
 * @param bit_depth sample bit depth; values <= 8 select the 8-bit routines,
 *                  values in (8, 10] select the "_10_" routines, and larger
 *                  values install nothing
 */
av_cold void ff_h264chroma_init_x86(H264ChromaContext *c, int bit_depth)
{
    int high_bit_depth = bit_depth > 8;
    int cpu_flags      = av_get_cpu_flags();

    if (EXTERNAL_MMX(cpu_flags) && !high_bit_depth) {
        c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_rnd_mmx;
        c->put_h264_chroma_pixels_tab[1] = ff_put_h264_chroma_mc4_mmx;
    }

    if (EXTERNAL_AMD3DNOW(cpu_flags) && !high_bit_depth) {
        c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_rnd_3dnow;
        c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_3dnow;
    }

    /* Overrides the 3DNow! avg entries when both flags are set. */
    if (EXTERNAL_MMXEXT(cpu_flags) && !high_bit_depth) {
        c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_rnd_mmxext;
        c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_mmxext;
        c->avg_h264_chroma_pixels_tab[2] = ff_avg_h264_chroma_mc2_mmxext;
        c->put_h264_chroma_pixels_tab[2] = ff_put_h264_chroma_mc2_mmxext;
    }

    if (EXTERNAL_MMXEXT(cpu_flags) && bit_depth > 8 && bit_depth <= 10) {
        c->put_h264_chroma_pixels_tab[2] = ff_put_h264_chroma_mc2_10_mmxext;
        c->avg_h264_chroma_pixels_tab[2] = ff_avg_h264_chroma_mc2_10_mmxext;
        c->put_h264_chroma_pixels_tab[1] = ff_put_h264_chroma_mc4_10_mmxext;
        c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_10_mmxext;
    }

    if (EXTERNAL_SSE2(cpu_flags) && bit_depth > 8 && bit_depth <= 10) {
        c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_10_sse2;
        c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_10_sse2;
    }

    /* Overrides the MMX/MMXEXT/3DNow! entries in slots 0 and 1. */
    if (EXTERNAL_SSSE3(cpu_flags) && !high_bit_depth) {
        c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_rnd_ssse3;
        c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_rnd_ssse3;
        c->put_h264_chroma_pixels_tab[1] = ff_put_h264_chroma_mc4_ssse3;
        c->avg_h264_chroma_pixels_tab[1] = ff_avg_h264_chroma_mc4_ssse3;
    }

    /* Overrides the SSE2 entries in slot 0. */
    if (EXTERNAL_AVX(cpu_flags) && bit_depth > 8 && bit_depth <= 10) {
        // AVX implies !cache64.
        // TODO: Port cache(32|64) detection from x264.
        c->put_h264_chroma_pixels_tab[0] = ff_put_h264_chroma_mc8_10_avx;
        c->avg_h264_chroma_pixels_tab[0] = ff_avg_h264_chroma_mc8_10_avx;
    }
}