Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in / Register
Toggle navigation
F
ffmpeg
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Packages
Packages
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
submodule
ffmpeg
Commits
55519926
Commit
55519926
authored
Jan 28, 2014
by
Diego Biurrun
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
x86: Make function prototype comments in assembly code consistent
This helps grepping for functions, among other things.
parent
edd1f833
Hide whitespace changes
Inline
Side-by-side
Showing
24 changed files
with
308 additions
and
246 deletions
+308
-246
dsputil.asm
libavcodec/x86/dsputil.asm
+11
-6
dsputilenc.asm
libavcodec/x86/dsputilenc.asm
+8
-7
fmtconvert.asm
libavcodec/x86/fmtconvert.asm
+7
-4
fpel.asm
libavcodec/x86/fpel.asm
+6
-3
h263_loopfilter.asm
libavcodec/x86/h263_loopfilter.asm
+2
-2
h264_chromamc.asm
libavcodec/x86/h264_chromamc.asm
+3
-2
h264_chromamc_10bit.asm
libavcodec/x86/h264_chromamc_10bit.asm
+6
-5
h264_deblock.asm
libavcodec/x86/h264_deblock.asm
+24
-18
h264_deblock_10bit.asm
libavcodec/x86/h264_deblock_10bit.asm
+14
-7
h264_idct.asm
libavcodec/x86/h264_idct.asm
+43
-42
h264_idct_10bit.asm
libavcodec/x86/h264_idct_10bit.asm
+16
-12
h264_intrapred.asm
libavcodec/x86/h264_intrapred.asm
+57
-39
h264_intrapred_10bit.asm
libavcodec/x86/h264_intrapred_10bit.asm
+41
-33
h264_qpel_10bit.asm
libavcodec/x86/h264_qpel_10bit.asm
+16
-16
h264_weight.asm
libavcodec/x86/h264_weight.asm
+5
-5
h264_weight_10bit.asm
libavcodec/x86/h264_weight_10bit.asm
+5
-4
hpeldsp.asm
libavcodec/x86/hpeldsp.asm
+11
-11
mpeg4qpel.asm
libavcodec/x86/mpeg4qpel.asm
+2
-2
proresdsp.asm
libavcodec/x86/proresdsp.asm
+2
-2
qpel.asm
libavcodec/x86/qpel.asm
+6
-3
rv40dsp.asm
libavcodec/x86/rv40dsp.asm
+4
-4
sbrdsp.asm
libavcodec/x86/sbrdsp.asm
+4
-4
vp8dsp.asm
libavcodec/x86/vp8dsp.asm
+10
-10
vp8dsp_loopfilter.asm
libavcodec/x86/vp8dsp_loopfilter.asm
+5
-5
No files found.
libavcodec/x86/dsputil.asm
View file @
55519926
...
...
@@ -34,7 +34,7 @@ pb_bswap32: db 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12
SECTION_TEXT
%macro
SCALARPRODUCT
0
; int scalarproduct_int16(int16_t *v1, int16_t *v2, int order)
; int
ff_
scalarproduct_int16(int16_t *v1, int16_t *v2, int order)
cglobal
scalarproduct_int16
,
3
,
3
,
3
,
v1
,
v2
,
order
shl
orderq
,
1
add
v1q
,
orderq
...
...
@@ -61,7 +61,8 @@ cglobal scalarproduct_int16, 3,3,3, v1, v2, order
movd
eax
,
m2
RET
; int scalarproduct_and_madd_int16(int16_t *v1, int16_t *v2, int16_t *v3, int order, int mul)
; int ff_scalarproduct_and_madd_int16(int16_t *v1, int16_t *v2, int16_t *v3,
; int order, int mul)
cglobal
scalarproduct_and_madd_int16
,
4
,
4
,
8
,
v1
,
v2
,
v3
,
order
,
mul
shl
orderq
,
1
movd
m7
,
mulm
...
...
@@ -157,7 +158,8 @@ align 16
%endif
%endmacro
; int scalarproduct_and_madd_int16(int16_t *v1, int16_t *v2, int16_t *v3, int order, int mul)
; int ff_scalarproduct_and_madd_int16(int16_t *v1, int16_t *v2, int16_t *v3,
; int order, int mul)
INIT_XMM
ssse3
cglobal
scalarproduct_and_madd_int16
,
4
,
5
,
10
,
v1
,
v2
,
v3
,
order
,
mul
shl
orderq
,
1
...
...
@@ -331,7 +333,9 @@ INIT_XMM ssse3, atom
APPLY_WINDOW_INT16
1
; void add_hfyu_median_prediction_mmxext(uint8_t *dst, const uint8_t *top, const uint8_t *diff, int w, int *left, int *left_top)
; void ff_add_hfyu_median_prediction_mmxext(uint8_t *dst, const uint8_t *top,
; const uint8_t *diff, int w,
; int *left, int *left_top)
INIT_MMX
mmxext
cglobal
add_hfyu_median_prediction
,
6
,
6
,
0
,
dst
,
top
,
diff
,
w
,
left
,
left_top
movq
mm0
,
[topq]
...
...
@@ -434,7 +438,8 @@ cglobal add_hfyu_median_prediction, 6,6,0, dst, top, diff, w, left, left_top
RET
%endmacro
; int add_hfyu_left_prediction(uint8_t *dst, const uint8_t *src, int w, int left)
; int ff_add_hfyu_left_prediction(uint8_t *dst, const uint8_t *src,
; int w, int left)
INIT_MMX
ssse3
cglobal
add_hfyu_left_prediction
,
3
,
3
,
7
,
dst
,
src
,
w
,
left
.
skip_prologue
:
...
...
@@ -595,7 +600,7 @@ VECTOR_CLIP_INT32 6, 1, 0, 0
add
r0
,
16
%endmacro
; void bswap_buf(uint32_t *dst, const uint32_t *src, int w);
; void ff_bswap32_buf(uint32_t *dst, const uint32_t *src, int w);
%macro
BSWAP32_BUF
0
%if
cpuflag
(
ssse3
)
cglobal
bswap32_buf
,
3
,
4
,
3
...
...
libavcodec/x86/dsputilenc.asm
View file @
55519926
...
...
@@ -209,8 +209,8 @@ hadamard8x8_diff %+ SUFFIX:
hadamard8_16_wrapper
%1
,
3
%elif
cpuflag
(
mmx
)
ALIGN
16
; int
hadamard8_diff_##
cpu(void *s, uint8_t *src1, uint8_t *src2,
; int stride, int h)
; int
ff_hadamard8_diff_ ##
cpu(void *s, uint8_t *src1, uint8_t *src2,
;
int stride, int h)
; r0 = void *s = unused, int h = unused (always 8)
; note how r1, r2 and r3 are not clobbered in this function, so 16x16
; can simply call this 2x2x (and that's why we access rsp+gprsize
...
...
@@ -275,7 +275,7 @@ INIT_XMM ssse3
HADAMARD8_DIFF
9
INIT_XMM
sse2
;
sse16_sse2(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h)
;
int ff_sse16_sse2(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
cglobal
sse16
,
5
,
5
,
8
shr
r4d
,
1
pxor
m0
,
m0
; mm0 = 0
...
...
@@ -335,7 +335,7 @@ cglobal sse16, 5, 5, 8
RET
INIT_MMX
mmx
; get_pixels_mmx(int16_t *block, const uint8_t *pixels, int line_size)
;
void ff_
get_pixels_mmx(int16_t *block, const uint8_t *pixels, int line_size)
cglobal
get_pixels
,
3
,
4
movsxdifnidn
r2
,
r2d
add
r0
,
128
...
...
@@ -392,7 +392,8 @@ cglobal get_pixels, 3, 4
RET
INIT_MMX
mmx
; diff_pixels_mmx(int16_t *block, const uint8_t *s1, const unint8_t *s2, stride)
; void ff_diff_pixels_mmx(int16_t *block, const uint8_t *s1, const uint8_t *s2,
; int stride);
cglobal
diff_pixels
,
4
,
5
movsxdifnidn
r3
,
r3d
pxor
m7
,
m7
...
...
@@ -418,7 +419,7 @@ cglobal diff_pixels, 4,5
REP_RET
INIT_MMX
mmx
;
pix_sum16_mmx(uint8_t *
pix, int line_size)
;
int ff_pix_sum16_mmx(uint8_t *
pix, int line_size)
cglobal
pix_sum16
,
2
,
3
movsxdifnidn
r1
,
r1d
mov
r2
,
r1
...
...
@@ -453,7 +454,7 @@ cglobal pix_sum16, 2, 3
RET
INIT_MMX
mmx
; pix_norm1_mmx(uint8_t *pix, int line_size)
;
int ff_
pix_norm1_mmx(uint8_t *pix, int line_size)
cglobal
pix_norm1
,
2
,
4
movsxdifnidn
r1
,
r1d
mov
r2
,
16
...
...
libavcodec/x86/fmtconvert.asm
View file @
55519926
...
...
@@ -31,9 +31,10 @@ SECTION_TEXT
%endif
%endmacro
;---------------------------------------------------------------------------------
; void int32_to_float_fmul_scalar(float *dst, const int32_t *src, float mul, int len);
;---------------------------------------------------------------------------------
;------------------------------------------------------------------------------
; void ff_int32_to_float_fmul_scalar(float *dst, const int32_t *src, float mul,
; int len);
;------------------------------------------------------------------------------
%macro
INT32_TO_FLOAT_FMUL_SCALAR
1
%if
UNIX64
cglobal
int32_to_float_fmul_scalar
,
3
,
3
,
%1
,
dst
,
src
,
len
...
...
@@ -243,8 +244,10 @@ FLOAT_TO_INT16_INTERLEAVE2
INIT_XMM
sse2
FLOAT_TO_INT16_INTERLEAVE2
;-----------------------------------------------------------------------------
; void ff_float_to_int16_interleave6(int16_t *dst, const float **src, int len)
;-----------------------------------------------------------------------------
%macro
FLOAT_TO_INT16_INTERLEAVE6
0
; void float_to_int16_interleave6_sse(int16_t *dst, const float **src, int len)
cglobal
float_to_int16_interleave6
,
2
,
8
,
0
,
dst
,
src
,
src1
,
src2
,
src3
,
src4
,
src5
,
len
%if
ARCH_X86_64
mov
lend
,
r2d
...
...
libavcodec/x86/fpel.asm
View file @
55519926
...
...
@@ -26,7 +26,8 @@
SECTION
.
text
INIT_MMX
mmxext
; void pixels(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_put/avg_pixels(uint8_t *block, const uint8_t *pixels,
; ptrdiff_t line_size, int h)
%macro
PIXELS48
2
%if
%2
==
4
%define
OP
movh
...
...
@@ -65,7 +66,8 @@ PIXELS48 avg, 8
INIT_XMM
sse2
; void put_pixels16_sse2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_put_pixels16_sse2(uint8_t *block, const uint8_t *pixels,
; ptrdiff_t line_size, int h)
cglobal
put_pixels16
,
4
,
5
,
4
lea
r4
,
[
r2
*
3
]
.
loop
:
...
...
@@ -83,7 +85,8 @@ cglobal put_pixels16, 4,5,4
jnz
.
loop
REP_RET
; void avg_pixels16_sse2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_avg_pixels16_sse2(uint8_t *block, const uint8_t *pixels,
; ptrdiff_t line_size, int h)
cglobal
avg_pixels16
,
4
,
5
,
4
lea
r4
,
[
r2
*
3
]
.
loop
:
...
...
libavcodec/x86/h263_loopfilter.asm
View file @
55519926
...
...
@@ -99,7 +99,7 @@ SECTION_TEXT
%endmacro
INIT_MMX
mmx
; void
h263_v_loop_filter
(uint8_t *src, int stride, int qscale)
; void
ff_h263_v_loop_filter_mmx
(uint8_t *src, int stride, int qscale)
cglobal
h263_v_loop_filter
,
3
,
5
movsxdifnidn
r1
,
r1d
movsxdifnidn
r2
,
r2d
...
...
@@ -140,7 +140,7 @@ cglobal h263_v_loop_filter, 3,5
%endmacro
; void
h263_h_loop_filter
(uint8_t *src, int stride, int qscale)
; void
ff_h263_h_loop_filter_mmx
(uint8_t *src, int stride, int qscale)
INIT_MMX
mmx
cglobal
h263_h_loop_filter
,
3
,
5
,
0
,
32
movsxdifnidn
r1
,
r1d
...
...
libavcodec/x86/h264_chromamc.asm
View file @
55519926
...
...
@@ -103,8 +103,9 @@ SECTION .text
%else
%define
extra_regs
0
%endif
; rv40
; put/avg_h264_chroma_mc8_*(uint8_t *dst /*align 8*/, uint8_t *src /*align 1*/,
; int stride, int h, int mx, int my)
; void ff_put/avg_h264_chroma_mc8_*(uint8_t *dst /* align 8 */,
; uint8_t *src /* align 1 */,
; int stride, int h, int mx, int my)
cglobal
%1
_
%2
_chroma_mc8
%3
,
6
,
7
+
extra_regs
,
0
%if
ARCH_X86_64
movsxd
r2
,
r2d
...
...
libavcodec/x86/h264_chromamc_10bit.asm
View file @
55519926
...
...
@@ -57,11 +57,10 @@ SECTION .text
%endmacro
;-----------------------------------------------------------------------------
; void put/avg_h264_chroma_mc8(pixel *dst, pixel *src, int stride, int h, int mx, int my)
; void ff_put/avg_h264_chroma_mc8(pixel *dst, pixel *src, int stride, int h,
; int mx, int my)
;-----------------------------------------------------------------------------
%macro
CHROMA_MC8
1
; put/avg_h264_chroma_mc8_*(uint8_t *dst /*align 8*/, uint8_t *src /*align 1*/,
; int stride, int h, int mx, int my)
cglobal
%1
_h264_chroma_mc8_10
,
6
,
7
,
8
movsxdifnidn
r2
,
r2d
mov
r6d
,
r5d
...
...
@@ -150,7 +149,8 @@ cglobal %1_h264_chroma_mc8_10, 6,7,8
%endmacro
;-----------------------------------------------------------------------------
; void put/avg_h264_chroma_mc4(pixel *dst, pixel *src, int stride, int h, int mx, int my)
; void ff_put/avg_h264_chroma_mc4(pixel *dst, pixel *src, int stride, int h,
; int mx, int my)
;-----------------------------------------------------------------------------
;TODO: xmm mc4
%macro
MC4_OP
2
...
...
@@ -200,7 +200,8 @@ cglobal %1_h264_chroma_mc4_10, 6,6,7
%endmacro
;-----------------------------------------------------------------------------
; void put/avg_h264_chroma_mc2(pixel *dst, pixel *src, int stride, int h, int mx, int my)
; void ff_put/avg_h264_chroma_mc2(pixel *dst, pixel *src, int stride, int h,
; int mx, int my)
;-----------------------------------------------------------------------------
%macro
CHROMA_MC2
1
cglobal
%1
_h264_chroma_mc2_10
,
6
,
7
...
...
libavcodec/x86/h264_deblock.asm
View file @
55519926
...
...
@@ -283,7 +283,8 @@ cextern pb_3
%if
ARCH_X86_64
;-----------------------------------------------------------------------------
; void deblock_v_luma( uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0 )
; void ff_deblock_v_luma(uint8_t *pix, int stride, int alpha, int beta,
; int8_t *tc0)
;-----------------------------------------------------------------------------
%macro
DEBLOCK_LUMA
0
cglobal
deblock_v_luma_8
,
5
,
5
,
10
...
...
@@ -328,7 +329,8 @@ cglobal deblock_v_luma_8, 5,5,10
RET
;-----------------------------------------------------------------------------
; void deblock_h_luma( uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0 )
; void ff_deblock_h_luma(uint8_t *pix, int stride, int alpha, int beta,
; int8_t *tc0)
;-----------------------------------------------------------------------------
INIT_MMX
cpuname
cglobal
deblock_h_luma_8
,
5
,
9
,
0
,
0x60
+
16
*
WIN64
...
...
@@ -389,7 +391,8 @@ DEBLOCK_LUMA
%macro
DEBLOCK_LUMA
2
;-----------------------------------------------------------------------------
; void deblock_v8_luma( uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0 )
; void ff_deblock_v8_luma(uint8_t *pix, int stride, int alpha, int beta,
; int8_t *tc0)
;-----------------------------------------------------------------------------
cglobal
deblock_
%1
_luma_8
,
5
,
5
,
8
,
2
*
%2
lea
r4
,
[
r1
*
3
]
...
...
@@ -437,7 +440,8 @@ cglobal deblock_%1_luma_8, 5,5,8,2*%2
RET
;-----------------------------------------------------------------------------
; void deblock_h_luma( uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0 )
; void ff_deblock_h_luma(uint8_t *pix, int stride, int alpha, int beta,
; int8_t *tc0)
;-----------------------------------------------------------------------------
INIT_MMX
cpuname
cglobal
deblock_h_luma_8
,
0
,
5
,
8
,
0x60
+
HAVE_ALIGNED_STACK
*
12
...
...
@@ -635,7 +639,7 @@ DEBLOCK_LUMA v, 16
%endif
;-----------------------------------------------------------------------------
; void
deblock_v_luma_intra( uint8_t *pix, int stride, int alpha, int beta
)
; void
ff_deblock_v_luma_intra(uint8_t *pix, int stride, int alpha, int beta
)
;-----------------------------------------------------------------------------
%if
WIN64
cglobal
deblock_
%1
_luma_intra_8
,
4
,
6
,
16
,
0x10
...
...
@@ -695,7 +699,7 @@ cglobal deblock_%1_luma_intra_8, 4,6,16,ARCH_X86_64*0x50-0x50
INIT_MMX
cpuname
%if
ARCH_X86_64
;-----------------------------------------------------------------------------
; void
deblock_h_luma_intra( uint8_t *pix, int stride, int alpha, int beta
)
; void
ff_deblock_h_luma_intra(uint8_t *pix, int stride, int alpha, int beta
)
;-----------------------------------------------------------------------------
cglobal
deblock_h_luma_intra_8
,
4
,
9
,
0
,
0x80
movsxd
r7
,
r1d
...
...
@@ -798,7 +802,8 @@ INIT_MMX mmxext
%define
t6
r6
;-----------------------------------------------------------------------------
; void ff_deblock_v_chroma( uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0 )
; void ff_deblock_v_chroma(uint8_t *pix, int stride, int alpha, int beta,
; int8_t *tc0)
;-----------------------------------------------------------------------------
cglobal
deblock_v_chroma_8
,
5
,
6
CHROMA_V_START
...
...
@@ -812,7 +817,8 @@ cglobal deblock_v_chroma_8, 5,6
RET
;-----------------------------------------------------------------------------
; void ff_deblock_h_chroma( uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0 )
; void ff_deblock_h_chroma(uint8_t *pix, int stride, int alpha, int beta,
; int8_t *tc0)
;-----------------------------------------------------------------------------
cglobal
deblock_h_chroma_8
,
5
,
7
%if
UNIX64
...
...
@@ -864,9 +870,9 @@ ff_chroma_inter_body_mmxext:
%define
t5
r4
%define
t6
r5
;-----------------------------------------------------------------------------
; void ff_deblock_v_chroma_intra(
uint8_t *pix, int stride, int alpha, int beta
)
;-----------------------------------------------------------------------------
;-----------------------------------------------------------------------------
-
; void ff_deblock_v_chroma_intra(
uint8_t *pix, int stride, int alpha, int beta
)
;-----------------------------------------------------------------------------
-
cglobal
deblock_v_chroma_intra_8
,
4
,
5
CHROMA_V_START
movq
m0
,
[t5]
...
...
@@ -878,9 +884,9 @@ cglobal deblock_v_chroma_intra_8, 4,5
movq
[r0],
m2
RET
;-----------------------------------------------------------------------------
; void ff_deblock_h_chroma_intra(
uint8_t *pix, int stride, int alpha, int beta
)
;-----------------------------------------------------------------------------
;-----------------------------------------------------------------------------
-
; void ff_deblock_h_chroma_intra(
uint8_t *pix, int stride, int alpha, int beta
)
;-----------------------------------------------------------------------------
-
cglobal
deblock_h_chroma_intra_8
,
4
,
6
CHROMA_H_START
TRANSPOSE4x8_LOAD
bw
,
wd
,
dq
,
PASS8ROWS
(
t5
,
r0
,
r1
,
t6
)
...
...
@@ -904,10 +910,10 @@ ff_chroma_intra_body_mmxext:
ret
;-----------------------------------------------------------------------------
; void h264_loop_filter_strength(int16_t bs[2][4][4], uint8_t nnz[40],
; int8_t ref[2][40], int16_t mv[2][40][2],
; int bidir, int edges, int step,
; int mask_mv0, int mask_mv1, int field);
; void
ff_
h264_loop_filter_strength(int16_t bs[2][4][4], uint8_t nnz[40],
;
int8_t ref[2][40], int16_t mv[2][40][2],
;
int bidir, int edges, int step,
;
int mask_mv0, int mask_mv1, int field);
;
; bidir is 0 or 1
; edges is 1 or 4
...
...
libavcodec/x86/h264_deblock_10bit.asm
View file @
55519926
...
...
@@ -152,7 +152,8 @@ cextern pw_4
%macro
DEBLOCK_LUMA
0
;-----------------------------------------------------------------------------
; void deblock_v_luma( uint16_t *pix, int stride, int alpha, int beta, int8_t *tc0 )
; void ff_deblock_v_luma_10(uint16_t *pix, int stride, int alpha, int beta,
; int8_t *tc0)
;-----------------------------------------------------------------------------
cglobal
deblock_v_luma_10
,
5
,
5
,
8
*
(
mmsize
/
16
)
%
assign
pad
5
*
mmsize
+
12
-
(
stack_offset
&
15
)
...
...
@@ -598,7 +599,8 @@ DEBLOCK_LUMA_64
%if
ARCH_X86_64
;-----------------------------------------------------------------------------
; void deblock_v_luma_intra( uint16_t *pix, int stride, int alpha, int beta )
; void ff_deblock_v_luma_intra_10(uint16_t *pix, int stride, int alpha,
; int beta)
;-----------------------------------------------------------------------------
%macro
DEBLOCK_LUMA_INTRA_64
0
cglobal
deblock_v_luma_intra_10
,
4
,
7
,
16
...
...
@@ -649,7 +651,8 @@ cglobal deblock_v_luma_intra_10, 4,7,16
REP_RET
;-----------------------------------------------------------------------------
; void deblock_h_luma_intra( uint16_t *pix, int stride, int alpha, int beta )
; void ff_deblock_h_luma_intra_10(uint16_t *pix, int stride, int alpha,
; int beta)
;-----------------------------------------------------------------------------
cglobal
deblock_h_luma_intra_10
,
4
,
7
,
16
%
define
t0
m15
...
...
@@ -719,7 +722,8 @@ DEBLOCK_LUMA_INTRA_64
%macro
DEBLOCK_LUMA_INTRA
0
;-----------------------------------------------------------------------------
; void deblock_v_luma_intra( uint16_t *pix, int stride, int alpha, int beta )
; void ff_deblock_v_luma_intra_10(uint16_t *pix, int stride, int alpha,
; int beta)
;-----------------------------------------------------------------------------
cglobal
deblock_v_luma_intra_10
,
4
,
7
,
8
*
(
mmsize
/
16
)
LUMA_INTRA_INIT
3
...
...
@@ -747,7 +751,8 @@ cglobal deblock_v_luma_intra_10, 4,7,8*(mmsize/16)
RET
;-----------------------------------------------------------------------------
; void deblock_h_luma_intra( uint16_t *pix, int stride, int alpha, int beta )
; void ff_deblock_h_luma_intra_10(uint16_t *pix, int stride, int alpha,
; int beta)
;-----------------------------------------------------------------------------
cglobal
deblock_h_luma_intra_10
,
4
,
7
,
8
*
(
mmsize
/
16
)
LUMA_INTRA_INIT
8
...
...
@@ -843,7 +848,8 @@ DEBLOCK_LUMA_INTRA
%macro
DEBLOCK_CHROMA
0
;-----------------------------------------------------------------------------
; void deblock_v_chroma( uint16_t *pix, int stride, int alpha, int beta, int8_t *tc0 )
; void ff_deblock_v_chroma_10(uint16_t *pix, int stride, int alpha, int beta,
; int8_t *tc0)
;-----------------------------------------------------------------------------
cglobal
deblock_v_chroma_10
,
5
,
7
-
(
mmsize
/
16
),
8
*
(
mmsize
/
16
)
mov
r5
,
r0
...
...
@@ -877,7 +883,8 @@ cglobal deblock_v_chroma_10, 5,7-(mmsize/16),8*(mmsize/16)
%endif
;-----------------------------------------------------------------------------
; void deblock_v_chroma_intra( uint16_t *pix, int stride, int alpha, int beta )
; void ff_deblock_v_chroma_intra_10(uint16_t *pix, int stride, int alpha,
; int beta)
;-----------------------------------------------------------------------------
cglobal
deblock_v_chroma_intra_10
,
4
,
6
-
(
mmsize
/
16
),
8
*
(
mmsize
/
16
)
mov
r4
,
r0
...
...
libavcodec/x86/h264_idct.asm
View file @
55519926
...
...
@@ -80,7 +80,7 @@ SECTION .text
%endmacro
INIT_MMX
mmx
; ff_h264_idct_add_8_mmx(uint8_t *dst, int16_t *block, int stride)
;
void
ff_h264_idct_add_8_mmx(uint8_t *dst, int16_t *block, int stride)
cglobal
h264_idct_add_8
,
3
,
3
,
0
IDCT4_ADD
r0
,
r1
,
r2
RET
...
...
@@ -202,7 +202,7 @@ cglobal h264_idct_add_8, 3, 3, 0
%endmacro
INIT_MMX
mmx
; ff_h264_idct8_add_8_mmx(uint8_t *dst, int16_t *block, int stride)
;
void
ff_h264_idct8_add_8_mmx(uint8_t *dst, int16_t *block, int stride)
cglobal
h264_idct8_add_8
,
3
,
4
,
0
%
assign
pad
128
+
4
-
(
stack_offset
&
7
)
SUB
rsp
,
pad
...
...
@@ -270,7 +270,7 @@ cglobal h264_idct8_add_8, 3, 4, 0
%endmacro
INIT_XMM
sse2
; ff_h264_idct8_add_8_sse2(uint8_t *dst, int16_t *block, int stride)
;
void
ff_h264_idct8_add_8_sse2(uint8_t *dst, int16_t *block, int stride)
cglobal
h264_idct8_add_8
,
3
,
4
,
10
IDCT8_ADD_SSE
r0
,
r1
,
r2
,
r3
RET
...
...
@@ -307,7 +307,7 @@ cglobal h264_idct8_add_8, 3, 4, 10
%endmacro
INIT_MMX
mmxext
; ff_h264_idct_dc_add_8_mmxext(uint8_t *dst, int16_t *block, int stride)
;
void
ff_h264_idct_dc_add_8_mmxext(uint8_t *dst, int16_t *block, int stride)
%if
ARCH_X86_64
cglobal
h264_idct_dc_add_8
,
3
,
4
,
0
movsx
r3
,
word
[r1]
...
...
@@ -316,7 +316,7 @@ cglobal h264_idct_dc_add_8, 3, 4, 0
DC_ADD_MMXEXT_OP
movh
,
r0
,
r2
,
r3
RET
; ff_h264_idct8_dc_add_8_mmxext(uint8_t *dst, int16_t *block, int stride)
;
void
ff_h264_idct8_dc_add_8_mmxext(uint8_t *dst, int16_t *block, int stride)
cglobal
h264_idct8_dc_add_8
,
3
,
4
,
0
movsx
r3
,
word
[r1]
mov
dword
[r1],
0
...
...
@@ -326,7 +326,7 @@ cglobal h264_idct8_dc_add_8, 3, 4, 0
DC_ADD_MMXEXT_OP
mova
,
r0
,
r2
,
r3
RET
%else
; ff_h264_idct_dc_add_8_mmxext(uint8_t *dst, int16_t *block, int stride)
;
void
ff_h264_idct_dc_add_8_mmxext(uint8_t *dst, int16_t *block, int stride)
cglobal
h264_idct_dc_add_8
,
2
,
3
,
0
movsx
r2
,
word
[r1]
mov
dword
[r1],
0
...
...
@@ -335,7 +335,7 @@ cglobal h264_idct_dc_add_8, 2, 3, 0
DC_ADD_MMXEXT_OP
movh
,
r0
,
r1
,
r2
RET
; ff_h264_idct8_dc_add_8_mmxext(uint8_t *dst, int16_t *block, int stride)
;
void
ff_h264_idct8_dc_add_8_mmxext(uint8_t *dst, int16_t *block, int stride)
cglobal
h264_idct8_dc_add_8
,
2
,
3
,
0
movsx
r2
,
word
[r1]
mov
dword
[r1],
0
...
...
@@ -348,9 +348,9 @@ cglobal h264_idct8_dc_add_8, 2, 3, 0
%endif
INIT_MMX
mmx
; ff_h264_idct_add16_8_mmx(uint8_t *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct_add16_8_mmx(uint8_t *dst, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct_add16_8
,
5
,
7
+
npicregs
,
0
,
dst
,
block_offset
,
block
,
stride
,
nnzc
,
cntr
,
coeff
,
picreg
xor
r5
,
r5
%ifdef
PIC
...
...
@@ -371,9 +371,9 @@ cglobal h264_idct_add16_8, 5, 7 + npicregs, 0, dst, block_offset, block, stride,
jl
.
nextblock
REP_RET
; ff_h264_idct8_add4_8_mmx(uint8_t *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct8_add4_8_mmx(uint8_t *dst, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct8_add4_8
,
5
,
7
+
npicregs
,
0
,
dst
,
block_offset
,
block
,
stride
,
nnzc
,
cntr
,
coeff
,
picreg
%
assign
pad
128
+
4
-
(
stack_offset
&
7
)
SUB
rsp
,
pad
...
...
@@ -405,9 +405,9 @@ cglobal h264_idct8_add4_8, 5, 7 + npicregs, 0, dst, block_offset, block, stride,
RET
INIT_MMX
mmxext
; ff_h264_idct_add16_8_mmxext(uint8_t *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct_add16_8_mmxext(uint8_t *dst, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct_add16_8
,
5
,
8
+
npicregs
,
0
,
dst1
,
block_offset
,
block
,
stride
,
nnzc
,
cntr
,
coeff
,
dst2
,
picreg
xor
r5
,
r5
%ifdef
PIC
...
...
@@ -452,9 +452,9 @@ cglobal h264_idct_add16_8, 5, 8 + npicregs, 0, dst1, block_offset, block, stride
REP_RET
INIT_MMX
mmx
; ff_h264_idct_add16intra_8_mmx(uint8_t *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct_add16intra_8_mmx(uint8_t *dst, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct_add16intra_8
,
5
,
7
+
npicregs
,
0
,
dst
,
block_offset
,
block
,
stride
,
nnzc
,
cntr
,
coeff
,
picreg
xor
r5
,
r5
%ifdef
PIC
...
...
@@ -477,9 +477,9 @@ cglobal h264_idct_add16intra_8, 5, 7 + npicregs, 0, dst, block_offset, block, st
REP_RET
INIT_MMX
mmxext
; ff_h264_idct_add16intra_8_mmxext(uint8_t *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct_add16intra_8_mmxext(uint8_t *dst, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct_add16intra_8
,
5
,
8
+
npicregs
,
0
,
dst1
,
block_offset
,
block
,
stride
,
nnzc
,
cntr
,
coeff
,
dst2
,
picreg
xor
r5
,
r5
%ifdef
PIC
...
...
@@ -521,9 +521,9 @@ cglobal h264_idct_add16intra_8, 5, 8 + npicregs, 0, dst1, block_offset, block, s
jl
.
nextblock
REP_RET
; ff_h264_idct8_add4_8_mmxext(uint8_t *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct8_add4_8_mmxext(uint8_t *dst, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct8_add4_8
,
5
,
8
+
npicregs
,
0
,
dst1
,
block_offset
,
block
,
stride
,
nnzc
,
cntr
,
coeff
,
dst2
,
picreg
%
assign
pad
128
+
4
-
(
stack_offset
&
7
)
SUB
rsp
,
pad
...
...
@@ -583,9 +583,9 @@ cglobal h264_idct8_add4_8, 5, 8 + npicregs, 0, dst1, block_offset, block, stride
RET
INIT_XMM
sse2
; ff_h264_idct8_add4_8_sse2(uint8_t *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct8_add4_8_sse2(uint8_t *dst, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct8_add4_8
,
5
,
8
+
npicregs
,
10
,
dst1
,
block_offset
,
block
,
stride
,
nnzc
,
cntr
,
coeff
,
dst2
,
picreg
xor
r5
,
r5
%ifdef
PIC
...
...
@@ -660,8 +660,9 @@ h264_idct_add8_mmx_plane:
jnz
.
nextblock
rep
ret
; ff_h264_idct_add8_8_mmx(uint8_t **dest, const int *block_offset,
; int16_t *block, int stride, const uint8_t nnzc[6 * 8])
; void ff_h264_idct_add8_8_mmx(uint8_t **dest, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
cglobal
h264_idct_add8_8
,
5
,
8
+
npicregs
,
0
,
dst1
,
block_offset
,
block
,
stride
,
nnzc
,
cntr
,
coeff
,
dst2
,
picreg
mov
r5
,
16
add
r2
,
512
...
...
@@ -725,9 +726,9 @@ h264_idct_add8_mmxext_plane:
rep
ret
INIT_MMX
mmxext
; ff_h264_idct_add8_8_mmxext(uint8_t **dest, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct_add8_8_mmxext(uint8_t **dest, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct_add8_8
,
5
,
8
+
npicregs
,
0
,
dst1
,
block_offset
,
block
,
stride
,
nnzc
,
cntr
,
coeff
,
dst2
,
picreg
mov
r5
,
16
add
r2
,
512
...
...
@@ -809,9 +810,9 @@ h264_add8x4_idct_sse2:
%endif
%endmacro
; ff_h264_idct_add16_8_sse2(uint8_t *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct_add16_8_sse2(uint8_t *dst, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct_add16_8
,
5
,
5
+
ARCH_X86_64
,
8
%if
ARCH_X86_64
mov
r5
,
r0
...
...
@@ -857,9 +858,9 @@ cglobal h264_idct_add16_8, 5, 5 + ARCH_X86_64, 8
%endif
%endmacro
; ff_h264_idct_add16intra_8_sse2(uint8_t *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct_add16intra_8_sse2(uint8_t *dst, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct_add16intra_8
,
5
,
7
+
ARCH_X86_64
,
8
%if
ARCH_X86_64
mov
r7
,
r0
...
...
@@ -909,9 +910,9 @@ cglobal h264_idct_add16intra_8, 5, 7 + ARCH_X86_64, 8
%endif
%endmacro
; ff_h264_idct_add8_8_sse2(uint8_t **dest, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6 * 8])
;
void
ff_h264_idct_add8_8_sse2(uint8_t **dest, const int *block_offset,
;
int16_t *block, int stride,
;
const uint8_t nnzc[6 * 8])
cglobal
h264_idct_add8_8
,
5
,
7
+
ARCH_X86_64
,
8
add
r2
,
512
%if
ARCH_X86_64
...
...
libavcodec/x86/h264_idct_10bit.asm
View file @
55519926
...
...
@@ -32,7 +32,7 @@ pd_32: times 4 dd 32
SECTION
.
text
;-----------------------------------------------------------------------------
; void
h264_idct_add
(pixel *dst, int16_t *block, int stride)
; void
ff_h264_idct_add_10
(pixel *dst, int16_t *block, int stride)
;-----------------------------------------------------------------------------
%macro
STORE_DIFFx2
6
psrad
%1
,
6
...
...
@@ -87,8 +87,9 @@ INIT_XMM avx
IDCT_ADD_10
;-----------------------------------------------------------------------------
; h264_idct_add16(pixel *dst, const int *block_offset, int16_t *block,
; int stride, const uint8_t nnzc[6*8])
; void ff_h264_idct_add16_10(pixel *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6*8])
;-----------------------------------------------------------------------------
;;;;;;; NO FATE SAMPLES TRIGGER THIS
%macro
ADD4x4IDCT
0
...
...
@@ -158,7 +159,7 @@ INIT_XMM avx
IDCT_ADD16_10
;-----------------------------------------------------------------------------
; void
h264_idct_dc_add
(pixel *dst, int16_t *block, int stride)
; void
ff_h264_idct_dc_add_10
(pixel *dst, int16_t *block, int stride)
;-----------------------------------------------------------------------------
%macro
IDCT_DC_ADD_OP_10
3
pxor
m5
,
m5
...
...
@@ -200,7 +201,7 @@ cglobal h264_idct_dc_add_10,3,3
RET
;-----------------------------------------------------------------------------
; void
h264_idct8_dc_add
(pixel *dst, int16_t *block, int stride)
; void
ff_h264_idct8_dc_add_10
(pixel *dst, int16_t *block, int stride)
;-----------------------------------------------------------------------------
%macro
IDCT8_DC_ADD
0
cglobal
h264_idct8_dc_add_10
,
3
,
4
,
7
...
...
@@ -223,8 +224,9 @@ INIT_XMM avx
IDCT8_DC_ADD
;-----------------------------------------------------------------------------
; h264_idct_add16intra(pixel *dst, const int *block_offset, int16_t *block,
; int stride, const uint8_t nnzc[6*8])
; void ff_h264_idct_add16intra_10(pixel *dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6*8])
;-----------------------------------------------------------------------------
%macro
AC
1
.
ac%1:
...
...
@@ -296,8 +298,9 @@ IDCT_ADD16INTRA_10
%assign
last_block
36
;-----------------------------------------------------------------------------
; h264_idct_add8(pixel **dst, const int *block_offset, int16_t *block,
; int stride, const uint8_t nnzc[6*8])
; void ff_h264_idct_add8_10(pixel **dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6*8])
;-----------------------------------------------------------------------------
%macro
IDCT_ADD8
0
cglobal
h264_idct_add8_10
,
5
,
8
,
7
...
...
@@ -331,7 +334,7 @@ INIT_XMM avx
IDCT_ADD8
;-----------------------------------------------------------------------------
; void
h264_idct8_add
(pixel *dst, int16_t *block, int stride)
; void
ff_h264_idct8_add_10
(pixel *dst, int16_t *block, int stride)
;-----------------------------------------------------------------------------
%macro
IDCT8_1D
2
SWAP
0
,
1
...
...
@@ -538,8 +541,9 @@ INIT_XMM avx
IDCT8_ADD
;-----------------------------------------------------------------------------
; h264_idct8_add4(pixel **dst, const int *block_offset, int16_t *block,
; int stride, const uint8_t nnzc[6*8])
; void ff_h264_idct8_add4_10(pixel **dst, const int *block_offset,
; int16_t *block, int stride,
; const uint8_t nnzc[6*8])
;-----------------------------------------------------------------------------
;;;;;;; NO FATE SAMPLES TRIGGER THIS
%macro
IDCT8_ADD4_OP
2
...
...
libavcodec/x86/h264_intrapred.asm
View file @
55519926
...
...
@@ -49,7 +49,7 @@ cextern pw_17
cextern
pw_32
;-----------------------------------------------------------------------------
; void pred16x16_vertical_8(uint8_t *src, int stride)
; void ff_pred16x16_vertical_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmx
...
...
@@ -85,7 +85,7 @@ cglobal pred16x16_vertical_8, 2,3
REP_RET
;-----------------------------------------------------------------------------
; void pred16x16_horizontal_8(uint8_t *src, int stride)
; void ff_pred16x16_horizontal_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED16x16_H
0
...
...
@@ -126,7 +126,7 @@ INIT_XMM ssse3
PRED16x16_H
;-----------------------------------------------------------------------------
; void pred16x16_dc_8(uint8_t *src, int stride)
; void ff_pred16x16_dc_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED16x16_DC
0
...
...
@@ -188,7 +188,7 @@ INIT_XMM ssse3
PRED16x16_DC
;-----------------------------------------------------------------------------
; void pred16x16_tm_vp8_8(uint8_t *src, int stride)
; void ff_pred16x16_tm_vp8_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED16x16_TM
0
...
...
@@ -269,7 +269,7 @@ cglobal pred16x16_tm_vp8_8, 2,6,6
REP_RET
;-----------------------------------------------------------------------------
; void pred16x16_plane_*_8(uint8_t *src, int stride)
; void ff_pred16x16_plane_*_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
H264_PRED16x16_PLANE
1
...
...
@@ -550,7 +550,7 @@ H264_PRED16x16_PLANE rv40
H264_PRED16x16_PLANE
svq3
;-----------------------------------------------------------------------------
; void pred8x8_plane_8(uint8_t *src, int stride)
; void ff_pred8x8_plane_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
H264_PRED8x8_PLANE
0
...
...
@@ -724,7 +724,7 @@ INIT_XMM ssse3
H264_PRED8x8_PLANE
;-----------------------------------------------------------------------------
; void pred8x8_vertical_8(uint8_t *src, int stride)
; void ff_pred8x8_vertical_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmx
...
...
@@ -741,7 +741,7 @@ cglobal pred8x8_vertical_8, 2,2
RET
;-----------------------------------------------------------------------------
; void pred8x8_horizontal_8(uint8_t *src, int stride)
; void ff_pred8x8_horizontal_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8_H
0
...
...
@@ -769,7 +769,7 @@ INIT_MMX ssse3
PRED8x8_H
;-----------------------------------------------------------------------------
; void pred8x8_top_dc_8_mmxext(uint8_t *src, int stride)
; void ff_pred8x8_top_dc_8_mmxext(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
cglobal
pred8x8_top_dc_8
,
2
,
5
...
...
@@ -803,7 +803,7 @@ cglobal pred8x8_top_dc_8, 2,5
RET
;-----------------------------------------------------------------------------
; void pred8x8_dc_8_mmxext(uint8_t *src, int stride)
; void ff_pred8x8_dc_8_mmxext(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
...
...
@@ -864,7 +864,7 @@ cglobal pred8x8_dc_8, 2,5
RET
;-----------------------------------------------------------------------------
; void pred8x8_dc_rv40_8(uint8_t *src, int stride)
; void ff_pred8x8_dc_rv40_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
...
...
@@ -901,7 +901,7 @@ cglobal pred8x8_dc_rv40_8, 2,7
REP_RET
;-----------------------------------------------------------------------------
; void pred8x8_tm_vp8_8(uint8_t *src, int stride)
; void ff_pred8x8_tm_vp8_8(uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8_TM
0
...
...
@@ -1013,7 +1013,8 @@ cglobal pred8x8_tm_vp8_8, 2,3,6
%endmacro
;-----------------------------------------------------------------------------
; void pred8x8l_top_dc_8(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_top_dc_8(uint8_t *src, int has_topleft, int has_topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_TOP_DC
0
cglobal
pred8x8l_top_dc_8
,
4
,
4
...
...
@@ -1068,7 +1069,8 @@ INIT_MMX ssse3
PRED8x8L_TOP_DC
;-----------------------------------------------------------------------------
;void pred8x8l_dc_8(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_dc_8(uint8_t *src, int has_topleft, int has_topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_DC
0
...
...
@@ -1171,7 +1173,8 @@ INIT_MMX ssse3
PRED8x8L_DC
;-----------------------------------------------------------------------------
; void pred8x8l_horizontal_8(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_horizontal_8(uint8_t *src, int has_topleft,
; int has_topright, int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_HORIZONTAL
0
...
...
@@ -1242,7 +1245,8 @@ INIT_MMX ssse3
PRED8x8L_HORIZONTAL
;-----------------------------------------------------------------------------
; void pred8x8l_vertical_8(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_vertical_8(uint8_t *src, int has_topleft, int has_topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_VERTICAL
0
...
...
@@ -1292,7 +1296,8 @@ INIT_MMX ssse3
PRED8x8L_VERTICAL
;-----------------------------------------------------------------------------
;void pred8x8l_down_left_8(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_down_left_8(uint8_t *src, int has_topleft,
; int has_topright, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
...
...
@@ -1492,7 +1497,8 @@ INIT_MMX ssse3
PRED8x8L_DOWN_LEFT
;-----------------------------------------------------------------------------
;void pred8x8l_down_right_8_mmxext(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_down_right_8_mmxext(uint8_t *src, int has_topleft,
; int has_topright, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
...
...
@@ -1743,7 +1749,8 @@ INIT_MMX ssse3
PRED8x8L_DOWN_RIGHT
;-----------------------------------------------------------------------------
; void pred8x8l_vertical_right_8(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_vertical_right_8(uint8_t *src, int has_topleft,
; int has_topright, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
...
...
@@ -1970,7 +1977,8 @@ INIT_MMX ssse3
PRED8x8L_VERTICAL_RIGHT
;-----------------------------------------------------------------------------
;void pred8x8l_vertical_left_8(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_vertical_left_8(uint8_t *src, int has_topleft,
; int has_topright, int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_VERTICAL_LEFT
0
...
...
@@ -2059,7 +2067,8 @@ INIT_MMX ssse3
PRED8x8L_VERTICAL_LEFT
;-----------------------------------------------------------------------------
; void pred8x8l_horizontal_up_8(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_horizontal_up_8(uint8_t *src, int has_topleft,
; int has_topright, int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_HORIZONTAL_UP
0
...
...
@@ -2146,7 +2155,8 @@ INIT_MMX ssse3
PRED8x8L_HORIZONTAL_UP
;-----------------------------------------------------------------------------
;void pred8x8l_horizontal_down_8(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_horizontal_down_8(uint8_t *src, int has_topleft,
; int has_topright, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
...
...
@@ -2393,9 +2403,9 @@ PRED8x8L_HORIZONTAL_DOWN
INIT_MMX
ssse3
PRED8x8L_HORIZONTAL_DOWN
;-----------------------------------------------------------------------------
; void pred4x4_dc_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
;-----------------------------------------------------------------------------
;-------------------------------------------------------------------------------
; void ff_pred4x4_dc_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
;-------------------------------------------------------------------------------
INIT_MMX
mmxext
cglobal
pred4x4_dc_8
,
3
,
5
...
...
@@ -2424,7 +2434,8 @@ cglobal pred4x4_dc_8, 3,5
RET
;-----------------------------------------------------------------------------
; void pred4x4_tm_vp8_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
; void ff_pred4x4_tm_vp8_8_mmxext(uint8_t *src, const uint8_t *topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED4x4_TM
0
...
...
@@ -2505,7 +2516,8 @@ cglobal pred4x4_tm_vp8_8, 3,3
RET
;-----------------------------------------------------------------------------
; void pred4x4_vertical_vp8_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
; void ff_pred4x4_vertical_vp8_8_mmxext(uint8_t *src, const uint8_t *topright,
; int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
...
...
@@ -2525,7 +2537,8 @@ cglobal pred4x4_vertical_vp8_8, 3,3
RET
;-----------------------------------------------------------------------------
; void pred4x4_down_left_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
; void ff_pred4x4_down_left_8_mmxext(uint8_t *src, const uint8_t *topright,
; int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
cglobal
pred4x4_down_left_8
,
3
,
3
...
...
@@ -2550,9 +2563,10 @@ cglobal pred4x4_down_left_8, 3,3
movd
[
r1
+
r2
*
2
]
,
m0
RET
;-----------------------------------------------------------------------------
; void pred4x4_vertical_left_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
;-----------------------------------------------------------------------------
;------------------------------------------------------------------------------
; void ff_pred4x4_vertical_left_8_mmxext(uint8_t *src, const uint8_t *topright,
; int stride)
;------------------------------------------------------------------------------
INIT_MMX
mmxext
cglobal
pred4x4_vertical_left_8
,
3
,
3
...
...
@@ -2575,9 +2589,10 @@ cglobal pred4x4_vertical_left_8, 3,3
movh
[
r1
+
r2
*
2
]
,
m0
RET
;-----------------------------------------------------------------------------
; void pred4x4_horizontal_up_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
;-----------------------------------------------------------------------------
;------------------------------------------------------------------------------
; void ff_pred4x4_horizontal_up_8_mmxext(uint8_t *src, const uint8_t *topright,
; int stride)
;------------------------------------------------------------------------------
INIT_MMX
mmxext
cglobal
pred4x4_horizontal_up_8
,
3
,
3
...
...
@@ -2608,9 +2623,10 @@ cglobal pred4x4_horizontal_up_8, 3,3
movd
[
r1
+
r2
*
2
]
,
m1
RET
;-----------------------------------------------------------------------------
; void pred4x4_horizontal_down_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
;-----------------------------------------------------------------------------
;------------------------------------------------------------------------------
; void ff_pred4x4_horizontal_down_8_mmxext(uint8_t *src,
; const uint8_t *topright, int stride)
;------------------------------------------------------------------------------
INIT_MMX
mmxext
cglobal
pred4x4_horizontal_down_8
,
3
,
3
...
...
@@ -2644,7 +2660,8 @@ cglobal pred4x4_horizontal_down_8, 3,3
RET
;-----------------------------------------------------------------------------
; void pred4x4_vertical_right_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
; void ff_pred4x4_vertical_right_8_mmxext(uint8_t *src,
; const uint8_t *topright, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
...
...
@@ -2674,7 +2691,8 @@ cglobal pred4x4_vertical_right_8, 3,3
RET
;-----------------------------------------------------------------------------
; void pred4x4_down_right_8_mmxext(uint8_t *src, const uint8_t *topright, int stride)
; void ff_pred4x4_down_right_8_mmxext(uint8_t *src, const uint8_t *topright,
; int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
...
...
libavcodec/x86/h264_intrapred_10bit.asm
View file @
55519926
...
...
@@ -50,7 +50,7 @@ SECTION .text
%endmacro
;-----------------------------------------------------------------------------
; void pred4x4_down_right(pixel *src, const pixel *topright, int stride)
; void ff_pred4x4_down_right(pixel *src, const pixel *topright, int stride)
;-----------------------------------------------------------------------------
%macro
PRED4x4_DR
0
cglobal
pred4x4_down_right_10
,
3
,
3
...
...
@@ -85,9 +85,9 @@ PRED4x4_DR
INIT_XMM
avx
PRED4x4_DR
;-----------------------------------------------------------------------------
; void pred4x4_vertical_right(pixel *src, const pixel *topright, int stride)
;-----------------------------------------------------------------------------
;------------------------------------------------------------------------------
; void ff_pred4x4_vertical_right(pixel *src, const pixel *topright, int stride)
;------------------------------------------------------------------------------
%macro
PRED4x4_VR
0
cglobal
pred4x4_vertical_right_10
,
3
,
3
,
6
sub
r0
,
r2
...
...
@@ -122,9 +122,9 @@ PRED4x4_VR
INIT_XMM
avx
PRED4x4_VR
;-----------------------------------------------------------------------------
; void pred4x4_horizontal_down(pixel *src, const pixel *topright, int stride)
;-----------------------------------------------------------------------------
;-------------------------------------------------------------------------------
; void ff_pred4x4_horizontal_down(pixel *src, const pixel *topright, int stride)
;-------------------------------------------------------------------------------
%macro
PRED4x4_HD
0
cglobal
pred4x4_horizontal_down_10
,
3
,
3
sub
r0
,
r2
...
...
@@ -163,7 +163,7 @@ INIT_XMM avx
PRED4x4_HD
;-----------------------------------------------------------------------------
; void pred4x4_dc(pixel *src, const pixel *topright, int stride)
; void ff_pred4x4_dc(pixel *src, const pixel *topright, int stride)
;-----------------------------------------------------------------------------
%macro
HADDD
2
; sum junk
%if
mmsize
==
16
...
...
@@ -204,7 +204,7 @@ cglobal pred4x4_dc_10, 3, 3
RET
;-----------------------------------------------------------------------------
; void pred4x4_down_left(pixel *src, const pixel *topright, int stride)
; void ff_pred4x4_down_left(pixel *src, const pixel *topright, int stride)
;-----------------------------------------------------------------------------
%macro
PRED4x4_DL
0
cglobal
pred4x4_down_left_10
,
3
,
3
...
...
@@ -232,7 +232,7 @@ INIT_XMM avx
PRED4x4_DL
;-----------------------------------------------------------------------------
; void pred4x4_vertical_left(pixel *src, const pixel *topright, int stride)
; void ff_pred4x4_vertical_left(pixel *src, const pixel *topright, int stride)
;-----------------------------------------------------------------------------
%macro
PRED4x4_VL
0
cglobal
pred4x4_vertical_left_10
,
3
,
3
...
...
@@ -259,7 +259,7 @@ INIT_XMM avx
PRED4x4_VL
;-----------------------------------------------------------------------------
; void pred4x4_horizontal_up(pixel *src, const pixel *topright, int stride)
; void ff_pred4x4_horizontal_up(pixel *src, const pixel *topright, int stride)
;-----------------------------------------------------------------------------
INIT_MMX
mmxext
cglobal
pred4x4_horizontal_up_10
,
3
,
3
...
...
@@ -293,7 +293,7 @@ cglobal pred4x4_horizontal_up_10, 3, 3
;-----------------------------------------------------------------------------
; void pred8x8_vertical(pixel *src, int stride)
; void ff_pred8x8_vertical(pixel *src, int stride)
;-----------------------------------------------------------------------------
INIT_XMM
sse2
cglobal
pred8x8_vertical_10
,
2
,
2
...
...
@@ -309,7 +309,7 @@ cglobal pred8x8_vertical_10, 2, 2
RET
;-----------------------------------------------------------------------------
; void pred8x8_horizontal(pixel *src, int stride)
; void ff_pred8x8_horizontal(pixel *src, int stride)
;-----------------------------------------------------------------------------
INIT_XMM
sse2
cglobal
pred8x8_horizontal_10
,
2
,
3
...
...
@@ -329,7 +329,7 @@ cglobal pred8x8_horizontal_10, 2, 3
REP_RET
;-----------------------------------------------------------------------------
; void predict_8x8_dc(pixel *src, int stride)
; void ff_predict_8x8_dc(pixel *src, int stride)
;-----------------------------------------------------------------------------
%macro
MOV8
2
-
3
; sort of a hack, but it works
...
...
@@ -416,7 +416,7 @@ INIT_XMM sse2
PRED8x8_DC
pshuflw
;-----------------------------------------------------------------------------
; void pred8x8_top_dc(pixel *src, int stride)
; void ff_pred8x8_top_dc(pixel *src, int stride)
;-----------------------------------------------------------------------------
INIT_XMM
sse2
cglobal
pred8x8_top_dc_10
,
2
,
4
...
...
@@ -443,7 +443,7 @@ cglobal pred8x8_top_dc_10, 2, 4
RET
;-----------------------------------------------------------------------------
; void pred8x8_plane(pixel *src, int stride)
; void ff_pred8x8_plane(pixel *src, int stride)
;-----------------------------------------------------------------------------
INIT_XMM
sse2
cglobal
pred8x8_plane_10
,
2
,
7
,
7
...
...
@@ -506,7 +506,8 @@ cglobal pred8x8_plane_10, 2, 7, 7
;-----------------------------------------------------------------------------
; void pred8x8l_128_dc(pixel *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_128_dc(pixel *src, int has_topleft, int has_topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_128_DC
0
cglobal
pred8x8l_128_dc_10
,
4
,
4
...
...
@@ -530,7 +531,8 @@ INIT_XMM sse2
PRED8x8L_128_DC
;-----------------------------------------------------------------------------
; void pred8x8l_top_dc(pixel *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_top_dc(pixel *src, int has_topleft, int has_topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_TOP_DC
0
cglobal
pred8x8l_top_dc_10
,
4
,
4
,
6
...
...
@@ -566,9 +568,9 @@ PRED8x8L_TOP_DC
INIT_XMM
avx
PRED8x8L_TOP_DC
;-----------------------------------------------------------------------------
; void pred8x8l_dc(pixel *src, int has_topleft, int has_topright, int stride)
;-----------------------------------------------------------------------------
;-------------------------------------------------------------------------------
; void ff_pred8x8l_dc(pixel *src, int has_topleft, int has_topright, int stride)
;-------------------------------------------------------------------------------
;TODO: see if scalar is faster
%macro
PRED8x8L_DC
0
cglobal
pred8x8l_dc_10
,
4
,
6
,
6
...
...
@@ -624,7 +626,8 @@ INIT_XMM avx
PRED8x8L_DC
;-----------------------------------------------------------------------------
; void pred8x8l_vertical(pixel *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_vertical(pixel *src, int has_topleft, int has_topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_VERTICAL
0
cglobal
pred8x8l_vertical_10
,
4
,
4
,
6
...
...
@@ -657,7 +660,8 @@ INIT_XMM avx
PRED8x8L_VERTICAL
;-----------------------------------------------------------------------------
; void pred8x8l_horizontal(uint8_t *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_horizontal(uint8_t *src, int has_topleft, int has_topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_HORIZONTAL
0
cglobal
pred8x8l_horizontal_10
,
4
,
4
,
5
...
...
@@ -711,7 +715,8 @@ INIT_XMM avx
PRED8x8L_HORIZONTAL
;-----------------------------------------------------------------------------
;void pred8x8l_down_left(pixel *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_down_left(pixel *src, int has_topleft, int has_topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_DOWN_LEFT
0
cglobal
pred8x8l_down_left_10
,
4
,
4
,
7
...
...
@@ -777,7 +782,8 @@ INIT_XMM avx
PRED8x8L_DOWN_LEFT
;-----------------------------------------------------------------------------
;void pred8x8l_down_right(pixel *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_down_right(pixel *src, int has_topleft, int has_topright,
; int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_DOWN_RIGHT
0
; standard forbids this when has_topleft is false
...
...
@@ -849,7 +855,8 @@ INIT_XMM avx
PRED8x8L_DOWN_RIGHT
;-----------------------------------------------------------------------------
; void pred8x8l_vertical_right(pixel *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_vertical_right(pixel *src, int has_topleft,
; int has_topright, int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_VERTICAL_RIGHT
0
; likewise with 8x8l_down_right
...
...
@@ -917,7 +924,8 @@ INIT_XMM avx
PRED8x8L_VERTICAL_RIGHT
;-----------------------------------------------------------------------------
; void pred8x8l_horizontal_up(pixel *src, int has_topleft, int has_topright, int stride)
; void ff_pred8x8l_horizontal_up(pixel *src, int has_topleft,
; int has_topright, int stride)
;-----------------------------------------------------------------------------
%macro
PRED8x8L_HORIZONTAL_UP
0
cglobal
pred8x8l_horizontal_up_10
,
4
,
4
,
6
...
...
@@ -977,7 +985,7 @@ PRED8x8L_HORIZONTAL_UP
;-----------------------------------------------------------------------------
; void pred16x16_vertical(pixel *src, int stride)
; void ff_pred16x16_vertical(pixel *src, int stride)
;-----------------------------------------------------------------------------
%macro
MOV16
3
-
5
mova
[
%1
+
0
]
,
%2
...
...
@@ -1013,7 +1021,7 @@ INIT_XMM sse2
PRED16x16_VERTICAL
;-----------------------------------------------------------------------------
; void pred16x16_horizontal(pixel *src, int stride)
; void ff_pred16x16_horizontal(pixel *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED16x16_HORIZONTAL
0
cglobal
pred16x16_horizontal_10
,
2
,
3
...
...
@@ -1037,7 +1045,7 @@ INIT_XMM sse2
PRED16x16_HORIZONTAL
;-----------------------------------------------------------------------------
; void pred16x16_dc(pixel *src, int stride)
; void ff_pred16x16_dc(pixel *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED16x16_DC
0
cglobal
pred16x16_dc_10
,
2
,
6
...
...
@@ -1083,7 +1091,7 @@ INIT_XMM sse2
PRED16x16_DC
;-----------------------------------------------------------------------------
; void pred16x16_top_dc(pixel *src, int stride)
; void ff_pred16x16_top_dc(pixel *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED16x16_TOP_DC
0
cglobal
pred16x16_top_dc_10
,
2
,
3
...
...
@@ -1115,7 +1123,7 @@ INIT_XMM sse2
PRED16x16_TOP_DC
;-----------------------------------------------------------------------------
; void pred16x16_left_dc(pixel *src, int stride)
; void ff_pred16x16_left_dc(pixel *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED16x16_LEFT_DC
0
cglobal
pred16x16_left_dc_10
,
2
,
6
...
...
@@ -1152,7 +1160,7 @@ INIT_XMM sse2
PRED16x16_LEFT_DC
;-----------------------------------------------------------------------------
; void pred16x16_128_dc(pixel *src, int stride)
; void ff_pred16x16_128_dc(pixel *src, int stride)
;-----------------------------------------------------------------------------
%macro
PRED16x16_128_DC
0
cglobal
pred16x16_128_dc_10
,
2
,
3
...
...
libavcodec/x86/h264_qpel_10bit.asm
View file @
55519926
...
...
@@ -167,7 +167,7 @@ stub_%1_h264_qpel%3_%2_10 %+ SUFFIX:
%endmacro
;-----------------------------------------------------------------------------
; void h264_qpel_mc00(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc00(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
COPY4
0
movu
m0
,
[
r1
]
...
...
@@ -221,7 +221,7 @@ MC00 put
MC00
avg
;-----------------------------------------------------------------------------
; void h264_qpel_mc20(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc20(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC_CACHE
1
%define
OP_MOV
mova
...
...
@@ -305,7 +305,7 @@ cglobal_mc %1, mc20, %2, 3,4,9
MC_CACHE
MC20
;-----------------------------------------------------------------------------
; void h264_qpel_mc30(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc30(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC30
2
cglobal_mc
%1
,
mc30
,
%2
,
3
,
5
,
9
...
...
@@ -316,7 +316,7 @@ cglobal_mc %1, mc30, %2, 3,5,9
MC_CACHE
MC30
;-----------------------------------------------------------------------------
; void h264_qpel_mc10(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc10(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC10
2
cglobal_mc
%1
,
mc10
,
%2
,
3
,
5
,
9
...
...
@@ -383,7 +383,7 @@ cglobal_mc %1, mc10, %2, 3,5,9
MC_CACHE
MC10
;-----------------------------------------------------------------------------
; void h264_qpel_mc02(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc02(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
V_FILT
10
v_filt
%9
_
%10
_10
...
...
@@ -432,7 +432,7 @@ cglobal_mc %1, mc02, %2, 3,4,8
MC
MC02
;-----------------------------------------------------------------------------
; void h264_qpel_mc01(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc01(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC01
2
cglobal_mc
%1
,
mc01
,
%2
,
3
,
5
,
8
...
...
@@ -458,7 +458,7 @@ cglobal_mc %1, mc01, %2, 3,5,8
MC
MC01
;-----------------------------------------------------------------------------
; void h264_qpel_mc03(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc03(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC03
2
cglobal_mc
%1
,
mc03
,
%2
,
3
,
5
,
8
...
...
@@ -469,7 +469,7 @@ cglobal_mc %1, mc03, %2, 3,5,8
MC
MC03
;-----------------------------------------------------------------------------
; void h264_qpel_mc11(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc11(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
H_FILT_AVG
2
-
3
h_filt
%1
_
%2
_10
:
...
...
@@ -551,7 +551,7 @@ cglobal_mc %1, mc11, %2, 3,6,8
MC
MC11
;-----------------------------------------------------------------------------
; void h264_qpel_mc31(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc31(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC31
2
cglobal_mc
%1
,
mc31
,
%2
,
3
,
6
,
8
...
...
@@ -563,7 +563,7 @@ cglobal_mc %1, mc31, %2, 3,6,8
MC
MC31
;-----------------------------------------------------------------------------
; void h264_qpel_mc13(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc13(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC13
2
cglobal_mc
%1
,
mc13
,
%2
,
3
,
7
,
12
...
...
@@ -574,7 +574,7 @@ cglobal_mc %1, mc13, %2, 3,7,12
MC
MC13
;-----------------------------------------------------------------------------
; void h264_qpel_mc33(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc33(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC33
2
cglobal_mc
%1
,
mc33
,
%2
,
3
,
6
,
8
...
...
@@ -586,7 +586,7 @@ cglobal_mc %1, mc33, %2, 3,6,8
MC
MC33
;-----------------------------------------------------------------------------
; void h264_qpel_mc22(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc22(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
FILT_H2
3
psubw
%1
,
%2
; a-b
...
...
@@ -757,7 +757,7 @@ cglobal_mc %1, mc22, %2, 3,7,12
MC
MC22
;-----------------------------------------------------------------------------
; void h264_qpel_mc12(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc12(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC12
2
cglobal_mc
%1
,
mc12
,
%2
,
3
,
7
,
12
...
...
@@ -802,7 +802,7 @@ cglobal_mc %1, mc12, %2, 3,7,12
MC
MC12
;-----------------------------------------------------------------------------
; void h264_qpel_mc32(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc32(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC32
2
cglobal_mc
%1
,
mc32
,
%2
,
3
,
7
,
12
...
...
@@ -820,7 +820,7 @@ cglobal_mc %1, mc32, %2, 3,7,12
MC
MC32
;-----------------------------------------------------------------------------
; void h264_qpel_mc21(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc21(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
H_NRD
1
put_h
%1
_10
:
...
...
@@ -873,7 +873,7 @@ cglobal_mc %1, mc21, %2, 3,7,12
MC
MC21
;-----------------------------------------------------------------------------
; void h264_qpel_mc23(uint8_t *dst, uint8_t *src, int stride)
; void ff_h264_qpel_mc23(uint8_t *dst, uint8_t *src, int stride)
;-----------------------------------------------------------------------------
%macro
MC23
2
cglobal_mc
%1
,
mc23
,
%2
,
3
,
7
,
12
...
...
libavcodec/x86/h264_weight.asm
View file @
55519926
...
...
@@ -28,12 +28,12 @@ SECTION .text
;-----------------------------------------------------------------------------
; biweight pred:
;
; void h264_biweight_16_sse2(uint8_t *dst, uint8_t *src, int stride,
; int height, int log2_denom, int weightd,
; int weights, int offset);
; void ff_h264_biweight_16_sse2(uint8_t *dst, uint8_t *src, int stride,
; int height, int log2_denom, int weightd,
; int weights, int offset);
; and
; void h264_weight_16_sse2(uint8_t *dst, int stride, int height,
; int log2_denom, int weight, int offset);
; void ff_h264_weight_16_sse2(uint8_t *dst, int stride, int height,
; int log2_denom, int weight, int offset);
;-----------------------------------------------------------------------------
%macro
WEIGHT_SETUP
0
...
...
libavcodec/x86/h264_weight_10bit.asm
View file @
55519926
...
...
@@ -35,8 +35,8 @@ cextern pw_1
SECTION
.
text
;-----------------------------------------------------------------------------
; void h264_weight(uint8_t *dst, int stride, int height, int log2_denom,
; int weight, int offset);
; void ff_h264_weight_16_10(uint8_t *dst, int stride, int height,
; int log2_denom, int weight, int offset);
;-----------------------------------------------------------------------------
%macro
WEIGHT_PROLOGUE
0
.
prologue
:
...
...
@@ -151,8 +151,9 @@ WEIGHT_FUNC_HALF_MM
;-----------------------------------------------------------------------------
; void h264_biweight(uint8_t *dst, uint8_t *src, int stride, int height,
; int log2_denom, int weightd, int weights, int offset);
; void ff_h264_biweight_16_10(uint8_t *dst, uint8_t *src, int stride,
; int height, int log2_denom, int weightd,
; int weights, int offset);
;-----------------------------------------------------------------------------
%if
ARCH_X86_32
DECLARE_REG_TMP
3
...
...
libavcodec/x86/hpeldsp.asm
View file @
55519926
...
...
@@ -25,7 +25,7 @@ cextern pb_1
SECTION_TEXT
; put_pixels8_x2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_put_pixels8_x2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
PUT_PIXELS8_X2
0
cglobal
put_pixels8_x2
,
4
,
5
lea
r4
,
[
r2
*
2
]
...
...
@@ -57,7 +57,7 @@ INIT_MMX 3dnow
PUT_PIXELS8_X2
; put_pixels16_x2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_put_pixels16_x2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
PUT_PIXELS_16
0
cglobal
put_pixels16_x2
,
4
,
5
lea
r4
,
[
r2
*
2
]
...
...
@@ -101,7 +101,7 @@ INIT_MMX 3dnow
PUT_PIXELS_16
; put_no_rnd_pixels8_x2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_put_no_rnd_pixels8_x2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
PUT_NO_RND_PIXELS8_X2
0
cglobal
put_no_rnd_pixels8_x2
,
4
,
5
mova
m6
,
[
pb_1
]
...
...
@@ -142,7 +142,7 @@ INIT_MMX 3dnow
PUT_NO_RND_PIXELS8_X2
; put_no_rnd_pixels8_x2_exact(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_put_no_rnd_pixels8_x2_exact(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
PUT_NO_RND_PIXELS8_X2_EXACT
0
cglobal
put_no_rnd_pixels8_x2_exact
,
4
,
5
lea
r4
,
[
r2
*
3
]
...
...
@@ -189,7 +189,7 @@ INIT_MMX 3dnow
PUT_NO_RND_PIXELS8_X2_EXACT
; put_pixels8_y2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_put_pixels8_y2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
PUT_PIXELS8_Y2
0
cglobal
put_pixels8_y2
,
4
,
5
lea
r4
,
[
r2
*
2
]
...
...
@@ -223,7 +223,7 @@ INIT_MMX 3dnow
PUT_PIXELS8_Y2
; put_no_rnd_pixels8_y2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_put_no_rnd_pixels8_y2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
PUT_NO_RND_PIXELS8_Y2
0
cglobal
put_no_rnd_pixels8_y2
,
4
,
5
mova
m6
,
[
pb_1
]
...
...
@@ -260,7 +260,7 @@ INIT_MMX 3dnow
PUT_NO_RND_PIXELS8_Y2
; put_no_rnd_pixels8_y2_exact(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_put_no_rnd_pixels8_y2_exact(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
PUT_NO_RND_PIXELS8_Y2_EXACT
0
cglobal
put_no_rnd_pixels8_y2_exact
,
4
,
5
lea
r4
,
[
r2
*
3
]
...
...
@@ -302,7 +302,7 @@ INIT_MMX 3dnow
PUT_NO_RND_PIXELS8_Y2_EXACT
; avg_pixels8(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_avg_pixels8(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
AVG_PIXELS8
0
cglobal
avg_pixels8
,
4
,
5
lea
r4
,
[
r2
*
2
]
...
...
@@ -332,7 +332,7 @@ INIT_MMX 3dnow
AVG_PIXELS8
; avg_pixels8_x2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_avg_pixels8_x2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
AVG_PIXELS8_X2
0
cglobal
avg_pixels8_x2
,
4
,
5
lea
r4
,
[
r2
*
2
]
...
...
@@ -368,7 +368,7 @@ INIT_MMX 3dnow
AVG_PIXELS8_X2
; avg_pixels8_y2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_avg_pixels8_y2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
AVG_PIXELS8_Y2
0
cglobal
avg_pixels8_y2
,
4
,
5
lea
r4
,
[
r2
*
2
]
...
...
@@ -410,7 +410,7 @@ INIT_MMX 3dnow
AVG_PIXELS8_Y2
; avg_pixels8_xy2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
; void ff_avg_pixels8_xy2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
%macro
AVG_PIXELS8_XY2
0
cglobal
avg_pixels8_xy2
,
4
,
5
mova
m6
,
[
pb_1
]
...
...
libavcodec/x86/mpeg4qpel.asm
View file @
55519926
...
...
@@ -31,7 +31,7 @@ cextern pw_20
SECTION_TEXT
; put_no_rnd_pixels8_l2(uint8_t *dst, uint8_t *src1, uint8_t *src2, int dstStride, int src1Stride, int h)
; void ff_put_no_rnd_pixels8_l2(uint8_t *dst, uint8_t *src1, uint8_t *src2, int dstStride, int src1Stride, int h)
%macro
PUT_NO_RND_PIXELS8_L2
0
cglobal
put_no_rnd_pixels8_l2
,
6
,
6
movsxdifnidn
r4
,
r4d
...
...
@@ -97,7 +97,7 @@ INIT_MMX mmxext
PUT_NO_RND_PIXELS8_L2
; put_no_rnd_pixels16_l2(uint8_t *dst, uint8_t *src1, uint8_t *src2, int dstStride, int src1Stride, int h)
; void ff_put_no_rnd_pixels16_l2(uint8_t *dst, uint8_t *src1, uint8_t *src2, int dstStride, int src1Stride, int h)
%macro
PUT_NO_RND_PIXELS16_l2
0
cglobal
put_no_rnd_pixels16_l2
,
6
,
6
movsxdifnidn
r3
,
r3d
...
...
libavcodec/x86/proresdsp.asm
View file @
55519926
...
...
@@ -326,8 +326,8 @@ section .text align=16
SUMSUB_SHPK
m2
,
m3
,
m4
,
m5
,
m6
,
m7
,
%2
%endmacro
; void prores_idct_put_10_<opt>(uint8_t *pixels, int stride,
; int16_t *block, const int16_t *qmat);
; void ff_prores_idct_put_10_<opt>(uint8_t *pixels, int stride,
; int16_t *block, const int16_t *qmat);
%macro
idct_put_fn
1
cglobal
prores_idct_put_10
,
4
,
4
,
%1
movsxd
r1
,
r1d
...
...
libavcodec/x86/qpel.asm
View file @
55519926
...
...
@@ -44,7 +44,8 @@ SECTION .text
mova
%2
,
%1
%endmacro
; void pixels4_l2_mmxext(uint8_t *dst, uint8_t *src1, uint8_t *src2, int dstStride, int src1Stride, int h)
; void ff_put/avg_pixels4_l2_mmxext(uint8_t *dst, uint8_t *src1, uint8_t *src2,
; int dstStride, int src1Stride, int h)
%macro
PIXELS4_L2
1
%define
OP
op_
%1
h
cglobal
%1
_pixels4_l2
,
6
,
6
...
...
@@ -87,7 +88,8 @@ INIT_MMX mmxext
PIXELS4_L2
put
PIXELS4_L2
avg
; void pixels8_l2_mmxext(uint8_t *dst, uint8_t *src1, uint8_t *src2, int dstStride, int src1Stride, int h)
; void ff_put/avg_pixels8_l2_mmxext(uint8_t *dst, uint8_t *src1, uint8_t *src2,
; int dstStride, int src1Stride, int h)
%macro
PIXELS8_L2
1
%define
OP
op_
%1
cglobal
%1
_pixels8_l2
,
6
,
6
...
...
@@ -130,7 +132,8 @@ INIT_MMX mmxext
PIXELS8_L2
put
PIXELS8_L2
avg
; void pixels16_l2_mmxext(uint8_t *dst, uint8_t *src1, uint8_t *src2, int dstStride, int src1Stride, int h)
; void ff_put/avg_pixels16_l2_mmxext(uint8_t *dst, uint8_t *src1, uint8_t *src2,
; int dstStride, int src1Stride, int h)
%macro
PIXELS16_L2
1
%define
OP
op_
%1
cglobal
%1
_pixels16_l2
,
6
,
6
...
...
libavcodec/x86/rv40dsp.asm
View file @
55519926
...
...
@@ -77,9 +77,9 @@ SECTION .text
;-----------------------------------------------------------------------------
; subpel MC functions:
;
; void [put|rv40]_rv40_qpel_[h|v]_<opt>(uint8_t *dst, int deststride,
; uint8_t *src, int srcstride,
; int len, int m);
; void ff_[put|rv40]_rv40_qpel_[h|v]_<opt>(uint8_t *dst, int deststride,
; uint8_t *src, int srcstride,
; int len, int m);
;----------------------------------------------------------------------
%macro
LOAD
2
%if
WIN64
...
...
@@ -438,7 +438,7 @@ FILTER_SSSE3 avg
%endmacro
; rv40_weight_func_%1(uint8_t *dst, uint8_t *src1, uint8_t *src2, int w1, int w2, int stride)
; void ff_rv40_weight_func_%1(uint8_t *dst, uint8_t *src1, uint8_t *src2, int w1, int w2, int stride)
; %1=size %2=num of xmm regs
; The weights are FP0.14 notation of fractions depending on pts.
; For timebases without rounding error (i.e. PAL), the fractions
...
...
libavcodec/x86/sbrdsp.asm
View file @
55519926
...
...
@@ -118,9 +118,9 @@ cglobal sbr_hf_g_filt, 5, 6, 5
.
end
:
RET
; static void sbr_hf_gen_c(float (*X_high)[2], const float (*X_low)[2],
; const float alpha0[2], const float alpha1[2],
; float bw, int start, int end)
; void ff_sbr_hf_gen_sse(float (*X_high)[2], const float (*X_low)[2],
; const float alpha0[2], const float alpha1[2],
; float bw, int start, int end)
;
cglobal
sbr_hf_gen
,
4
,
4
,
8
,
X_high
,
X_low
,
alpha0
,
alpha1
,
BW
,
S
,
E
; load alpha factors
...
...
@@ -247,7 +247,7 @@ cglobal sbr_neg_odd_64, 1,2,4,z
REP_RET
INIT_XMM
sse2
; sbr_qmf_deint_bfly(float *v, const float *src0, const float *src1)
; void ff_sbr_qmf_deint_bfly_sse2(float *v, const float *src0, const float *src1)
cglobal
sbr_qmf_deint_bfly
,
3
,
5
,
8
,
v
,
src0
,
src1
,
vrev
,
c
mov
cq
,
64
*
4
-
2
*
mmsize
lea
vrevq
,
[
vq
+
64
*
4
]
...
...
libavcodec/x86/vp8dsp.asm
View file @
55519926
...
...
@@ -153,13 +153,13 @@ cextern pw_64
SECTION
.
text
;-----------------------------------------------------------------------------
;-------------------------------------------------------------------------------
; subpel MC functions:
;
; void put_vp8_epel<size>_h<htap>v<vtap>_<opt>(uint8_t *dst, int deststride,
; uint8_t *src, int srcstride,
; int height, int mx, int my);
;-----------------------------------------------------------------------------
; void ff_put_vp8_epel<size>_h<htap>v<vtap>_<opt>(uint8_t *dst, int deststride,
; uint8_t *src, int srcstride,
; int height, int mx, int my);
;-------------------------------------------------------------------------------
%macro
FILTER_SSSE3
1
cglobal
put_vp8_epel
%1
_h6
,
6
,
6
+
npicregs
,
8
,
dst
,
dststride
,
src
,
srcstride
,
height
,
mx
,
picreg
...
...
@@ -884,7 +884,7 @@ cglobal put_vp8_pixels16, 5, 5, 2, dst, dststride, src, srcstride, height
REP_RET
;-----------------------------------------------------------------------------
; void vp8_idct_dc_add_<opt>(uint8_t *dst, int16_t block[16], int stride);
; void ff_vp8_idct_dc_add_<opt>(uint8_t *dst, int16_t block[16], int stride);
;-----------------------------------------------------------------------------
%macro
ADD_DC
4
...
...
@@ -962,7 +962,7 @@ cglobal vp8_idct_dc_add, 3, 3, 6, dst, block, stride
RET
;-----------------------------------------------------------------------------
; void vp8_idct_dc_add4y_<opt>(uint8_t *dst, int16_t block[4][16], int stride);
; void ff_vp8_idct_dc_add4y_<opt>(uint8_t *dst, int16_t block[4][16], int stride);
;-----------------------------------------------------------------------------
%if
ARCH_X86_32
...
...
@@ -1035,7 +1035,7 @@ cglobal vp8_idct_dc_add4y, 3, 3, 6, dst, block, stride
RET
;-----------------------------------------------------------------------------
; void vp8_idct_dc_add4uv_<opt>(uint8_t *dst, int16_t block[4][16], int stride);
; void ff_vp8_idct_dc_add4uv_<opt>(uint8_t *dst, int16_t block[4][16], int stride);
;-----------------------------------------------------------------------------
INIT_MMX
mmx
...
...
@@ -1077,7 +1077,7 @@ cglobal vp8_idct_dc_add4uv, 3, 3, 0, dst, block, stride
RET
;-----------------------------------------------------------------------------
; void vp8_idct_add_<opt>(uint8_t *dst, int16_t block[16], int stride);
; void ff_vp8_idct_add_<opt>(uint8_t *dst, int16_t block[16], int stride);
;-----------------------------------------------------------------------------
; calculate %1=mul_35468(%1)-mul_20091(%2); %2=mul_20091(%1)+mul_35468(%2)
...
...
@@ -1157,7 +1157,7 @@ INIT_MMX sse
VP8_IDCT_ADD
;-----------------------------------------------------------------------------
; void vp8_luma_dc_wht_mmxext(int16_t block[4][4][16], int16_t dc[16])
; void ff_vp8_luma_dc_wht(int16_t block[4][4][16], int16_t dc[16])
;-----------------------------------------------------------------------------
%macro
SCATTER_WHT
3
...
...
libavcodec/x86/vp8dsp_loopfilter.asm
View file @
55519926
...
...
@@ -43,7 +43,7 @@ cextern pb_80
SECTION
.
text
;-----------------------------------------------------------------------------
; void vp8_h/v_loop_filter_simple_<opt>(uint8_t *dst, int stride, int flim);
; void ff_vp8_h/v_loop_filter_simple_<opt>(uint8_t *dst, int stride, int flim);
;-----------------------------------------------------------------------------
; macro called with 7 mm register indexes as argument, and 4 regular registers
...
...
@@ -429,8 +429,8 @@ INIT_XMM sse4
SIMPLE_LOOPFILTER
h
,
5
;-----------------------------------------------------------------------------
; void vp8_h/v_loop_filter<size>_inner_<opt>(uint8_t *dst, [uint8_t *v,] int stride,
; int flimE, int flimI, int hev_thr);
; void ff_vp8_h/v_loop_filter<size>_inner_<opt>(uint8_t *dst, [uint8_t *v,] int stride,
; int flimE, int flimI, int hev_thr);
;-----------------------------------------------------------------------------
%macro
INNER_LOOPFILTER
2
...
...
@@ -921,8 +921,8 @@ INNER_LOOPFILTER v, 8
INNER_LOOPFILTER
h
,
8
;-----------------------------------------------------------------------------
; void vp8_h/v_loop_filter<size>_mbedge_<opt>(uint8_t *dst, [uint8_t *v,] int stride,
; int flimE, int flimI, int hev_thr);
; void ff_vp8_h/v_loop_filter<size>_mbedge_<opt>(uint8_t *dst, [uint8_t *v,] int stride,
; int flimE, int flimI, int hev_thr);
;-----------------------------------------------------------------------------
%macro
MBEDGE_LOOPFILTER
2
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment