20 |
# $Date$ |
# $Date$ |
21 |
# $Author$ |
# $Author$ |
22 |
# |
# |
23 |
# This is my first PPC ASM program. So I might do nasty things. |
# This is my first PPC ASM attempt. So I might do nasty things. |
24 |
# Please send any comments to guillaume@morinfr.org |
# Please send any comments to <guillaume@morinfr.org> |
25 |
|
|
26 |
|
|
27 |
# Returns a field of bits that indicates non zero ac blocks |
# Returns a field of bits that indicates non zero ac blocks |
50 |
# |
# |
51 |
#} |
#} |
52 |
|
|
53 |
|
.data |
54 |
|
.skip: |
55 |
|
.word 0,-1 |
56 |
|
.align 4 |
57 |
|
|
58 |
.text |
.text |
59 |
.global calc_cbp_ppc |
.global calc_cbp_ppc |
60 |
calc_cbp_ppc: |
calc_cbp_ppc: |
61 |
# r9 will contain coeffs addr |
# r9 will contain coeffs addr |
62 |
mr 9,3 |
mr 9,3 |
63 |
# r8 is the loop counter |
# r8 is the loop counter (rows) |
64 |
li 8,5 |
li 8,5 |
65 |
# r3 contains the result, therefore we set it to 0 |
# r3 contains the result, therefore we set it to 0 |
66 |
xor 3,3,3 |
li 3,0 |
67 |
.loop: |
.loop: |
68 |
# r7 is the loop2 counter, FIXME: use CTR |
# CTR is the loop2 counter |
69 |
li 7,14 |
li 4,16 |
70 |
|
mtctr 4 |
71 |
# r6 is coeff pointer for this line |
# r6 is coeff pointer for this line |
72 |
mr 6,9 |
mr 6,9 |
73 |
|
lis 7,.skip@ha |
74 |
|
addi 7,7,.skip@l |
75 |
|
lwz 7,0(7) |
76 |
.loop2: |
.loop2: |
77 |
# coeffs is a matrix of 16 bits cells |
# coeffs is a matrix of 16 bits cells |
78 |
lha 4,2(6) |
lwz 4,0(6) |
79 |
lha 5,4(6) |
and 4,4,7 |
80 |
or 4,5,4 |
li 7,-1 |
81 |
lha 5,6(6) |
|
82 |
or 4,5,4 |
lwz 5,4(6) |
|
lha 5,8(6) |
|
83 |
# or. updates CR0 |
# or. updates CR0 |
84 |
or. 4,5,4 |
or. 4,5,4 |
85 |
# testing bit 2 (is zero) of CR0 |
# testing bit 2 (is zero) of CR0 |
86 |
bc 4,2,.cbp |
bf 2,.cbp |
87 |
addi 6,6,8 |
addi 6,6,8 |
88 |
# subic. updates CR0 |
bdnz .loop2 |
89 |
subic. 7,7,1 |
b .newline |
|
# testing bit 0 (is negative) of CR0 |
|
|
bc 12,0,.lastcoeffs |
|
|
b .loop2 |
|
|
.lastcoeffs: |
|
|
lha 4,2(6) |
|
|
lha 5,4(6) |
|
|
or 4,5,4 |
|
|
lha 5,6(6) |
|
|
# or. updates CR0 |
|
|
or. 4,5,4 |
|
|
# testing bit 2 (is zero) of CR0 |
|
|
bc 12,2,.newline |
|
90 |
.cbp: |
.cbp: |
91 |
li 4,1 |
li 4,1 |
92 |
slw 4,4,8 |
slw 4,4,8 |
93 |
or 3,3,4 |
or 3,3,4 |
|
b .newline |
|
94 |
.newline: |
.newline: |
95 |
addi 9,9,128 |
addi 9,9,128 |
96 |
# updates CR0, blabla |
# updates CR0, blabla |
97 |
subic. 8,8,1 |
subic. 8,8,1 |
98 |
bc 4,0,.loop |
bf 0,.loop |
|
.end: |
|
99 |
blr |
blr |