Commit 1acffaf8 authored by mamonet

[PowerPC] Reverse the order of storing non-volatile vector registers

parent 5ff18cd1
Pipeline #56350 passed with stages
in 3 minutes and 5 seconds
@@ -195,16 +195,16 @@ endfunc
 function deblock_h_chroma_altivec
 h264_loop_filter_start
 subi 3,3,4
-subi 9,1,32
+subi 9,1,16
 stvx 31,0,9
-addi 9,9,16
+subi 9,9,16
 stvx 30,0,9
 VEC_LOAD_DATA 31,.trn_even_halfword_mask,10
 VEC_LOAD_DATA 30,.trn_odd_halfword_mask,9
 deblock_h_chroma
-subi 9,1,32
+subi 9,1,16
 lvx 31,0,9
-addi 9,9,16
+subi 9,9,16
 lvx 30,0,9
 blr
 endfunc
@@ -212,9 +212,9 @@ endfunc
 function deblock_h_chroma_422_altivec
 h264_loop_filter_start
 add 7,3,4
-subi 9,1,32
+subi 9,1,16
 stvx 31,0,9
-addi 9,9,16
+subi 9,9,16
 stvx 30,0,9
 subi 3,3,4
 VEC_LOAD_DATA 31,.trn_even_halfword_mask,10
@@ -225,9 +225,9 @@ function deblock_h_chroma_422_altivec
 subi 3,7,4
 vsldoi 14,14,14,4
 deblock_h_chroma
-subi 9,1,32
+subi 9,1,16
 lvx 31,0,9
-addi 9,9,16
+subi 9,9,16
 lvx 30,0,9
 blr
 endfunc
......
@@ -816,56 +816,56 @@ function mbtree_propagate_cost_altivec
 endfunc
 .macro mbtree_propagate_list_internal_prologue
-subi 10,1,192
+subi 10,1,16
 stvx 31,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 30,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 29,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 28,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 27,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 26,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 25,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 24,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 23,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 22,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 21,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 20,0,10
 .endm
 .macro mbtree_propagate_list_internal_epilogue
-subi 10,1,192
+subi 10,1,16
 lvx 31,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 30,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 29,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 28,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 27,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 26,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 25,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 24,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 23,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 22,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 21,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 20,0,10
 .endm
......
@@ -528,30 +528,30 @@ endfunc
 .macro sa8d_satd_8x8_prologue satd=
 .ifc \satd, satd
-subi 10,1,112
+subi 10,1,16
 stvx 31,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 30,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 29,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 28,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 27,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 26,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 25,0,10
 vxor 25,25,25
 .set sa8d_satd_8x8_zero,25
 .else
-subi 10,1,64
+subi 10,1,16
 stvx 31,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 30,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 29,0,10
-addi 10,10,16
+subi 10,10,16
 stvx 28,0,10
 vxor 18,18,18
 .set sa8d_satd_8x8_zero,18
@@ -562,28 +562,28 @@ endfunc
 .macro sa8d_satd_8x8_epilogue satd=
 .ifc \satd, satd
-subi 10,1,112
+subi 10,1,16
 lvx 31,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 30,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 29,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 28,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 27,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 26,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 25,0,10
 .else
-subi 10,1,64
+subi 10,1,16
 lvx 31,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 30,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 29,0,10
-addi 10,10,16
+subi 10,10,16
 lvx 28,0,10
 .endif
 .endm
......
@@ -291,10 +291,10 @@ endfunc
 .endm
 .macro coeff_level_run shift
-std 28,-8(1)
-std 29,-16(1)
-std 30,-24(1)
-std 31,-32(1)
+std 31,-8(1)
+std 30,-16(1)
+std 29,-24(1)
+std 28,-32(1)
 cntlzd 30,5
 srwi 31,30,\shift
 li 28,~((1 << \shift) - 1)
@@ -320,10 +320,10 @@ endfunc
 2:
 stw 8,4(4)
 extsw 3,7
-ld 28,-8(1)
-ld 29,-16(1)
-ld 30,-24(1)
-ld 31,-32(1)
+ld 31,-8(1)
+ld 30,-16(1)
+ld 29,-24(1)
+ld 28,-32(1)
 .endm
 #ifndef WORDS_BIGENDIAN
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment