/*
 * ARM NEON optimised DSP functions
 * Copyright (c) 2008 Mans Rullgard <mans@mansr.com>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
yading@10
|
21
|
yading@10
|
22 #include <stddef.h>
|
yading@10
|
23 #include <stdint.h>
|
yading@10
|
24
|
yading@10
|
25 #include "libavutil/attributes.h"
|
yading@10
|
26 #include "hpeldsp_arm.h"
|
yading@10
|
27
|
/*
 * Prototypes for the NEON routines installed by this file. Their
 * definitions are not part of this translation unit.
 *
 * All of them share one signature. The parameter names are informational
 * only and were chosen from the types and const-ness -- TODO confirm
 * against the function-pointer type used by the HpelDSPContext tables.
 */

/* put */
void ff_put_pixels16_neon(uint8_t *block, const uint8_t *pixels,
                          ptrdiff_t line_size, int h);
void ff_put_pixels16_x2_neon(uint8_t *block, const uint8_t *pixels,
                             ptrdiff_t line_size, int h);
void ff_put_pixels16_y2_neon(uint8_t *block, const uint8_t *pixels,
                             ptrdiff_t line_size, int h);
void ff_put_pixels16_xy2_neon(uint8_t *block, const uint8_t *pixels,
                              ptrdiff_t line_size, int h);
void ff_put_pixels8_neon(uint8_t *block, const uint8_t *pixels,
                         ptrdiff_t line_size, int h);
void ff_put_pixels8_x2_neon(uint8_t *block, const uint8_t *pixels,
                            ptrdiff_t line_size, int h);
void ff_put_pixels8_y2_neon(uint8_t *block, const uint8_t *pixels,
                            ptrdiff_t line_size, int h);
void ff_put_pixels8_xy2_neon(uint8_t *block, const uint8_t *pixels,
                             ptrdiff_t line_size, int h);

/* put, no_rnd variants */
void ff_put_pixels16_x2_no_rnd_neon(uint8_t *block, const uint8_t *pixels,
                                    ptrdiff_t line_size, int h);
void ff_put_pixels16_y2_no_rnd_neon(uint8_t *block, const uint8_t *pixels,
                                    ptrdiff_t line_size, int h);
void ff_put_pixels16_xy2_no_rnd_neon(uint8_t *block, const uint8_t *pixels,
                                     ptrdiff_t line_size, int h);
void ff_put_pixels8_x2_no_rnd_neon(uint8_t *block, const uint8_t *pixels,
                                   ptrdiff_t line_size, int h);
void ff_put_pixels8_y2_no_rnd_neon(uint8_t *block, const uint8_t *pixels,
                                   ptrdiff_t line_size, int h);
void ff_put_pixels8_xy2_no_rnd_neon(uint8_t *block, const uint8_t *pixels,
                                    ptrdiff_t line_size, int h);

/* avg */
void ff_avg_pixels16_neon(uint8_t *block, const uint8_t *pixels,
                          ptrdiff_t line_size, int h);
void ff_avg_pixels16_x2_neon(uint8_t *block, const uint8_t *pixels,
                             ptrdiff_t line_size, int h);
void ff_avg_pixels16_y2_neon(uint8_t *block, const uint8_t *pixels,
                             ptrdiff_t line_size, int h);
void ff_avg_pixels16_xy2_neon(uint8_t *block, const uint8_t *pixels,
                              ptrdiff_t line_size, int h);
void ff_avg_pixels8_neon(uint8_t *block, const uint8_t *pixels,
                         ptrdiff_t line_size, int h);
void ff_avg_pixels8_x2_neon(uint8_t *block, const uint8_t *pixels,
                            ptrdiff_t line_size, int h);
void ff_avg_pixels8_y2_neon(uint8_t *block, const uint8_t *pixels,
                            ptrdiff_t line_size, int h);
void ff_avg_pixels8_xy2_neon(uint8_t *block, const uint8_t *pixels,
                             ptrdiff_t line_size, int h);

/* avg, no_rnd variants (only pixels16 versions are declared) */
void ff_avg_pixels16_x2_no_rnd_neon(uint8_t *block, const uint8_t *pixels,
                                    ptrdiff_t line_size, int h);
void ff_avg_pixels16_y2_no_rnd_neon(uint8_t *block, const uint8_t *pixels,
                                    ptrdiff_t line_size, int h);
void ff_avg_pixels16_xy2_no_rnd_neon(uint8_t *block, const uint8_t *pixels,
                                     ptrdiff_t line_size, int h);
yading@10
|
54
|
yading@10
|
55 av_cold void ff_hpeldsp_init_neon(HpelDSPContext *c, int flags)
|
yading@10
|
56 {
|
yading@10
|
57 c->put_pixels_tab[0][0] = ff_put_pixels16_neon;
|
yading@10
|
58 c->put_pixels_tab[0][1] = ff_put_pixels16_x2_neon;
|
yading@10
|
59 c->put_pixels_tab[0][2] = ff_put_pixels16_y2_neon;
|
yading@10
|
60 c->put_pixels_tab[0][3] = ff_put_pixels16_xy2_neon;
|
yading@10
|
61 c->put_pixels_tab[1][0] = ff_put_pixels8_neon;
|
yading@10
|
62 c->put_pixels_tab[1][1] = ff_put_pixels8_x2_neon;
|
yading@10
|
63 c->put_pixels_tab[1][2] = ff_put_pixels8_y2_neon;
|
yading@10
|
64 c->put_pixels_tab[1][3] = ff_put_pixels8_xy2_neon;
|
yading@10
|
65
|
yading@10
|
66 c->put_no_rnd_pixels_tab[0][0] = ff_put_pixels16_neon;
|
yading@10
|
67 c->put_no_rnd_pixels_tab[0][1] = ff_put_pixels16_x2_no_rnd_neon;
|
yading@10
|
68 c->put_no_rnd_pixels_tab[0][2] = ff_put_pixels16_y2_no_rnd_neon;
|
yading@10
|
69 c->put_no_rnd_pixels_tab[0][3] = ff_put_pixels16_xy2_no_rnd_neon;
|
yading@10
|
70 c->put_no_rnd_pixels_tab[1][0] = ff_put_pixels8_neon;
|
yading@10
|
71 c->put_no_rnd_pixels_tab[1][1] = ff_put_pixels8_x2_no_rnd_neon;
|
yading@10
|
72 c->put_no_rnd_pixels_tab[1][2] = ff_put_pixels8_y2_no_rnd_neon;
|
yading@10
|
73 c->put_no_rnd_pixels_tab[1][3] = ff_put_pixels8_xy2_no_rnd_neon;
|
yading@10
|
74
|
yading@10
|
75 c->avg_pixels_tab[0][0] = ff_avg_pixels16_neon;
|
yading@10
|
76 c->avg_pixels_tab[0][1] = ff_avg_pixels16_x2_neon;
|
yading@10
|
77 c->avg_pixels_tab[0][2] = ff_avg_pixels16_y2_neon;
|
yading@10
|
78 c->avg_pixels_tab[0][3] = ff_avg_pixels16_xy2_neon;
|
yading@10
|
79 c->avg_pixels_tab[1][0] = ff_avg_pixels8_neon;
|
yading@10
|
80 c->avg_pixels_tab[1][1] = ff_avg_pixels8_x2_neon;
|
yading@10
|
81 c->avg_pixels_tab[1][2] = ff_avg_pixels8_y2_neon;
|
yading@10
|
82 c->avg_pixels_tab[1][3] = ff_avg_pixels8_xy2_neon;
|
yading@10
|
83
|
yading@10
|
84 c->avg_no_rnd_pixels_tab[0] = ff_avg_pixels16_neon;
|
yading@10
|
85 c->avg_no_rnd_pixels_tab[1] = ff_avg_pixels16_x2_no_rnd_neon;
|
yading@10
|
86 c->avg_no_rnd_pixels_tab[2] = ff_avg_pixels16_y2_no_rnd_neon;
|
yading@10
|
87 c->avg_no_rnd_pixels_tab[3] = ff_avg_pixels16_xy2_no_rnd_neon;
|
yading@10
|
88 }
|