Parent Directory | Revision Log
Revision 1.1 - (view) (download)
// File preamble and read-only lookup table `multipliers`.
// The table holds 32 four-byte entries (32 * 4 = 128 bytes, matching .size).
// Entry 0 is 0; every other entry q equals floor(65536 / (2*q)) + 1, so
// (x * multipliers[q]) >> 16 approximates x / (2*q) without a divide.
// quant_intra_ia64 and quant_inter_ia64 index the table with r34 scaled by 4.
3 : | ia64p | 1.1 | .file "quant_h263.c" |
2 : | .pred.safe_across_calls p1-p5,p16-p63 | ||
3 : | .section .rodata | ||
4 : | .align 4 | ||
5 : | .type multipliers#,@object | ||
6 : | .size multipliers#,128 | ||
7 : | multipliers: | ||
// index 0: unused divisor, multiplier 0
8 : | data4 0 | ||
// indices 1..31
9 : | data4 32769 | ||
10 : | data4 16385 | ||
11 : | data4 10923 | ||
12 : | data4 8193 | ||
13 : | data4 6554 | ||
14 : | data4 5462 | ||
15 : | data4 4682 | ||
16 : | data4 4097 | ||
17 : | data4 3641 | ||
18 : | data4 3277 | ||
19 : | data4 2979 | ||
20 : | data4 2731 | ||
21 : | data4 2521 | ||
22 : | data4 2341 | ||
23 : | data4 2185 | ||
24 : | data4 2049 | ||
25 : | data4 1928 | ||
26 : | data4 1821 | ||
27 : | data4 1725 | ||
28 : | data4 1639 | ||
29 : | data4 1561 | ||
30 : | data4 1490 | ||
31 : | data4 1425 | ||
32 : | data4 1366 | ||
33 : | data4 1311 | ||
34 : | data4 1261 | ||
35 : | data4 1214 | ||
36 : | data4 1171 | ||
37 : | data4 1130 | ||
38 : | data4 1093 | ||
39 : | data4 1058 | ||
// External helper called once by quant_intra_ia64 (signed 64-bit division).
40 : | .global __divdi3# | ||
// quant_intra_ia64
// Reads 64 signed halfwords through r33 and writes halfwords through r32.
//   r32 = destination pointer (every st2 goes through it)
//   r33 = source pointer (every ld2 goes through it)
//   r34 = index into `multipliers`; its low 15 bits, doubled, form the
//         zero threshold kept in r36
//   r35 = divisor, used for element 0 only
// Element 0:     (src[0] +/- (r35 >> 1)) / r35, computed by __divdi3; the
//                half-divisor is added when src[0] > 0, subtracted otherwise.
// Elements 1-63: m = |src[i]|. If m < r36 a zero is stored; otherwise bits
//                16..31 of m * multipliers[r34] are stored with the sign of
//                src[i] restored.
// Non-leaf procedure: b0 and ar.pfs are kept in r37/r38, ar.lc and f2 are
// saved on the stack and restored at .L16.
// NOTE(review): presumably the H.263 intra-block quantizer with r35 as the
// DC scaler - confirm against quant_h263.c.
41 : | .text | ||
42 : | .align 16 | ||
43 : | .global quant_intra_ia64# | ||
44 : | .proc quant_intra_ia64# | ||
45 : | quant_intra_ia64: | ||
46 : | .prologue //12, 37 | ||
47 : | .save ar.pfs, r38 | ||
// Register frame: 4 inputs (r32-r35), 3 locals (r36-r38), 2 outputs (r39-r40).
48 : | alloc r38 = ar.pfs, 4, 3, 2, 0 | ||
// r16 = entry sp - 8, which is sp + 24 once the 32-byte frame is open.
49 : | adds r16 = -8, r12 | ||
50 : | .fframe 32 | ||
51 : | adds r12 = -32, r12 | ||
52 : | mov r17 = ar.lc | ||
// r14 = address of the linkage-table slot holding &multipliers.
53 : | addl r14 = @ltoff(multipliers#), gp | ||
// r15 = src[0]
54 : | ld2 r15 = [r33] | ||
55 : | ;; | ||
56 : | .savesp ar.lc, 24 | ||
// Save ar.lc at sp + 24; the post-increment leaves r16 at the entry sp.
57 : | st8 [r16] = r17, 8 | ||
58 : | ld8 r14 = [r14] | ||
59 : | sxt2 r15 = r15 | ||
60 : | ;; | ||
61 : | .save.f 0x1 | ||
// Spill f2 to the 16 bytes starting at the entry sp; f2 carries the
// multiplier across the __divdi3 call below.
62 : | stf.spill [r16] = f2 | ||
63 : | .save rp, r37 | ||
64 : | mov r37 = b0 | ||
65 : | .body | ||
// r36 = (low 15 bits of r34) << 1  -> zero threshold
// r16 = r34 * 4                    -> byte offset into multipliers
// p6  = (src[0] <= 0)
66 : | dep.z r36 = r34, 1, 15 | ||
67 : | dep.z r16 = r34, 2, 32 | ||
68 : | cmp4.ge p6, p7 = 0, r15 | ||
69 : | ;; | ||
70 : | add r16 = r16, r14 | ||
71 : | ;; | ||
72 : | ld4 r16 = [r16] | ||
73 : | ;; | ||
// f2 = multipliers[r34], used by every xma.l below.
74 : | setf.sig f2 = r16 | ||
75 : | (p6) br.cond.dptk .L4 | ||
// src[0] > 0: dividend = src[0] + (r35 >> 1); out1 (r40) = sign-extended r35.
76 : | extr r39 = r35, 1, 31 | ||
77 : | sxt4 r40 = r35 | ||
78 : | ;; | ||
79 : | add r39 = r39, r15 | ||
80 : | br .L38 | ||
81 : | ;; | ||
82 : | .L4: | ||
// src[0] <= 0: dividend = src[0] - (r35 >> 1).
83 : | extr r39 = r35, 1, 31 | ||
84 : | sxt4 r40 = r35 | ||
85 : | ;; | ||
86 : | sub r39 = r15, r39 | ||
87 : | ;; | ||
88 : | .L38: | ||
// __divdi3(out0 = dividend, out1 = divisor); quotient comes back in r8.
89 : | sxt4 r39 = r39 | ||
90 : | br.call.sptk.many b0 = __divdi3# | ||
91 : | ;; | ||
// dst[0] = low 16 bits of the quotient.
// r16 = byte offset of element 1, r17 = element index 1.
92 : | addl r16 = 2, r0 | ||
93 : | st2 [r32] = r8 | ||
94 : | addl r17 = 1, r0 | ||
95 : | ;; | ||
// ---- Element 1, handled outside the loop ----
96 : | add r14 = r33, r16 | ||
97 : | ;; | ||
98 : | ld2 r15 = [r14] | ||
99 : | ;; | ||
100 : | sxt2 r15 = r15 | ||
101 : | ;; | ||
102 : | mov r14 = r15 | ||
103 : | ;; | ||
// p6 = (value >= 0) -> .L21 handles the non-negative case.
104 : | cmp4.le p6, p7 = r0, r14 | ||
105 : | (p6) br.cond.dptk .L21 | ||
// Negative value: r14 = magnitude.
106 : | sub r14 = r0, r14 | ||
107 : | ;; | ||
108 : | sxt2 r14 = r14 | ||
109 : | ;; | ||
// p6 = (magnitude >= threshold): quantize; p7 = below threshold: store 0.
110 : | cmp4.le p6, p7 = r36, r14 | ||
111 : | ;; | ||
// p6 and p7 are complementary, so only one of the r14 writer/reader runs.
112 : | (p7) add r14 = r32, r16 | ||
113 : | (p6) add r15 = r32, r16 | ||
114 : | (p6) setf.sig f6 = r14 | ||
115 : | ;; | ||
116 : | (p7) st2 [r14] = r0 | ||
117 : | (p6) xma.l f6 = f6, f2, f0 | ||
118 : | ;; | ||
119 : | (p6) getf.sig r14 = f6 | ||
120 : | ;; | ||
// Keep bits 16..31 of the product (sign-extended), then negate the result.
121 : | (p6) extr r14 = r14, 16, 16 | ||
122 : | ;; | ||
123 : | (p6) sub r14 = r0, r14 | ||
124 : | br .L39 | ||
125 : | ;; | ||
126 : | .L21: | ||
// Non-negative value: r14 and r15 both hold it; same threshold test.
127 : | cmp4.le p6, p7 = r36, r14 | ||
128 : | ;; | ||
129 : | (p7) add r14 = r32, r16 | ||
130 : | (p6) setf.sig f6 = r15 | ||
131 : | ;; | ||
132 : | (p7) st2 [r14] = r0 | ||
133 : | (p6) xma.l f6 = f6, f2, f0 | ||
134 : | (p6) add r15 = r32, r16 | ||
135 : | ;; | ||
136 : | (p6) getf.sig r14 = f6 | ||
137 : | ;; | ||
138 : | (p6) extr r14 = r14, 16, 16 | ||
139 : | .L39: | ||
140 : | //.pred.rel.mutex p6, p7 | ||
141 : | ;; | ||
// Store the quantized element 1 (address in r15), then advance to index 2.
142 : | (p6) st2 [r15] = r14 | ||
143 : | adds r17 = 1, r17 | ||
144 : | ;; | ||
145 : | cmp4.geu p6, p7 = 63, r17 | ||
146 : | (p7) br.cond.dptk .L16 | ||
// ar.lc = 30 -> 31 trips of .L37, two elements per trip (indices 2..63).
147 : | addl r14 = 30, r0 | ||
148 : | ;; | ||
149 : | mov ar.lc = r14 | ||
150 : | ;; | ||
151 : | .L37: | ||
// ---- Loop body, first element: index r17, byte offset r16 ----
152 : | dep.z r16 = r17, 1, 32 | ||
153 : | ;; | ||
154 : | add r14 = r16, r33 | ||
155 : | ;; | ||
156 : | ld2 r15 = [r14] | ||
157 : | ;; | ||
158 : | sxt2 r15 = r15 | ||
159 : | ;; | ||
160 : | mov r14 = r15 | ||
161 : | ;; | ||
162 : | cmp4.le p6, p7 = r0, r14 | ||
163 : | (p6) br.cond.dptk .L27 | ||
// Negative value: magnitude, threshold test, scale, negate.
164 : | sub r14 = r0, r14 | ||
165 : | ;; | ||
166 : | sxt2 r14 = r14 | ||
167 : | ;; | ||
168 : | cmp4.le p6, p7 = r36, r14 | ||
169 : | ;; | ||
170 : | (p7) add r14 = r16, r32 | ||
171 : | (p6) add r15 = r16, r32 | ||
172 : | (p6) setf.sig f6 = r14 | ||
173 : | ;; | ||
174 : | (p7) st2 [r14] = r0 | ||
175 : | (p6) xma.l f6 = f6, f2, f0 | ||
176 : | ;; | ||
177 : | (p6) getf.sig r14 = f6 | ||
178 : | ;; | ||
179 : | (p6) extr r14 = r14, 16, 16 | ||
180 : | ;; | ||
181 : | (p6) sub r14 = r0, r14 | ||
182 : | br .L40 | ||
183 : | ;; | ||
184 : | .L27: | ||
// Non-negative value: threshold test and scale.
185 : | cmp4.le p6, p7 = r36, r14 | ||
186 : | ;; | ||
187 : | (p7) add r14 = r16, r32 | ||
188 : | (p6) setf.sig f6 = r15 | ||
189 : | ;; | ||
190 : | (p7) st2 [r14] = r0 | ||
191 : | (p6) xma.l f6 = f6, f2, f0 | ||
192 : | (p6) add r15 = r16, r32 | ||
193 : | ;; | ||
194 : | (p6) getf.sig r14 = f6 | ||
195 : | ;; | ||
196 : | (p6) extr r14 = r14, 16, 16 | ||
197 : | .L40: | ||
198 : | //.pred.rel.mutex p6, p7 | ||
199 : | ;; | ||
200 : | (p6) st2 [r15] = r14 | ||
// ---- Loop body, second element: index r17 + 1 ----
201 : | adds r14 = 1, r17 | ||
202 : | ;; | ||
203 : | dep.z r16 = r14, 1, 32 | ||
204 : | ;; | ||
205 : | add r15 = r16, r33 | ||
206 : | ;; | ||
207 : | ld2 r14 = [r15] | ||
208 : | ;; | ||
209 : | sxt2 r14 = r14 | ||
210 : | ;; | ||
211 : | mov r15 = r14 | ||
212 : | ;; | ||
213 : | cmp4.le p6, p7 = r0, r15 | ||
214 : | (p6) br.cond.dptk .L33 | ||
// Negative value: r15 = magnitude.
215 : | sub r14 = r0, r15 | ||
216 : | ;; | ||
217 : | sxt2 r14 = r14 | ||
218 : | ;; | ||
219 : | mov r15 = r14 | ||
220 : | ;; | ||
221 : | cmp4.le p6, p7 = r36, r15 | ||
222 : | ;; | ||
223 : | (p7) add r14 = r16, r32 | ||
224 : | (p6) setf.sig f6 = r15 | ||
225 : | ;; | ||
226 : | (p7) st2 [r14] = r0 | ||
227 : | (p6) xma.l f6 = f6, f2, f0 | ||
228 : | (p6) add r15 = r16, r32 | ||
229 : | ;; | ||
230 : | (p6) getf.sig r14 = f6 | ||
231 : | ;; | ||
232 : | (p6) extr r14 = r14, 16, 16 | ||
233 : | ;; | ||
234 : | (p6) sub r14 = r0, r14 | ||
235 : | br .L41 | ||
236 : | .L33: | ||
// Non-negative value: r14 and r15 both hold it on entry here.
237 : | cmp4.le p6, p7 = r36, r15 | ||
238 : | ;; | ||
239 : | (p7) add r14 = r16, r32 | ||
240 : | (p6) add r15 = r16, r32 | ||
241 : | (p6) setf.sig f6 = r14 | ||
242 : | ;; | ||
243 : | (p7) st2 [r14] = r0 | ||
244 : | (p6) xma.l f6 = f6, f2, f0 | ||
245 : | ;; | ||
246 : | (p6) getf.sig r14 = f6 | ||
247 : | ;; | ||
248 : | (p6) extr r14 = r14, 16, 16 | ||
249 : | .L41: | ||
250 : | //.pred.rel.mutex p6, p7 | ||
251 : | ;; | ||
252 : | (p6) st2 [r15] = r14 | ||
// Advance two elements; br.cloop repeats while ar.lc is non-zero.
253 : | adds r17 = 2, r17 | ||
254 : | br.cloop.sptk.few .L37 | ||
255 : | .L16: | ||
// Epilogue: reload ar.lc from sp + 24 and f2 from sp + 32, restore ar.pfs
// and b0 from r38/r37, release the 32-byte frame and return.
256 : | adds r18 = 24, r12 | ||
257 : | ;; | ||
258 : | ld8 r19 = [r18], 8 | ||
259 : | mov ar.pfs = r38 | ||
260 : | mov b0 = r37 | ||
261 : | ;; | ||
262 : | mov ar.lc = r19 | ||
263 : | ldf.fill f2 = [r18] | ||
264 : | .restore sp | ||
265 : | adds r12 = 32, r12 | ||
266 : | br.ret.sptk.many b0 | ||
267 : | .endp quant_intra_ia64# | ||
// quant_inter_ia64
// Reads 64 signed halfwords through r33, writes 64 halfwords through r32,
// and accumulates the quantized magnitudes in r8 (the integer return
// register in the Itanium software conventions).
//   r32 = destination pointer, r33 = source pointer
//   r34 = index into `multipliers`; also the source of the bias and
//         threshold below
//   r18 = bits 1..16 of r34 (r34 >> 1), subtracted from each magnitude
//   r17 = (low 15 bits of r34) << 1, the zero threshold
//   f6  = multipliers[r34]
// Per element: m = |src[i]| - r18. If m < r17 a zero is stored; otherwise
// q = bits 16..31 of m * f6 is added to r8 and stored with the sign of
// src[i] restored.
// Leaf procedure: only ar.lc is preserved (in r2).
// NOTE(review): presumably the H.263 inter-block quantizer - confirm
// against quant_h263.c.
268 : | .align 16 | ||
269 : | .global quant_inter_ia64# | ||
270 : | .proc quant_inter_ia64# | ||
271 : | quant_inter_ia64: | ||
272 : | .prologue | ||
273 : | addl r14 = @ltoff(multipliers#), gp | ||
// r15 = r34 * 4, byte offset into multipliers.
274 : | dep.z r15 = r34, 2, 32 | ||
275 : | .save ar.lc, r2 | ||
276 : | mov r2 = ar.lc | ||
277 : | ;; | ||
278 : | .body | ||
279 : | ld8 r14 = [r14] | ||
280 : | extr.u r16 = r34, 1, 16 | ||
281 : | dep.z r17 = r34, 1, 15 | ||
282 : | ;; | ||
283 : | add r15 = r15, r14 | ||
284 : | mov r18 = r16 | ||
// r8 = running sum, starts at 0.
285 : | mov r8 = r0 | ||
286 : | ;; | ||
287 : | ld4 r15 = [r15] | ||
// ar.lc = 31 -> 32 trips of .L65, two elements per trip; r19 = index 0.
288 : | addl r14 = 31, r0 | ||
289 : | mov r19 = r0 | ||
290 : | ;; | ||
291 : | setf.sig f6 = r15 | ||
292 : | mov ar.lc = r14 | ||
293 : | ;; | ||
294 : | .L65: | ||
// ---- First element of the pair: index r19, byte offset r16 ----
295 : | dep.z r16 = r19, 1, 32 | ||
296 : | ;; | ||
297 : | add r14 = r16, r33 | ||
298 : | ;; | ||
299 : | ld2 r15 = [r14] | ||
300 : | ;; | ||
301 : | sxt2 r15 = r15 | ||
302 : | ;; | ||
303 : | mov r14 = r15 | ||
304 : | ;; | ||
// p6 = (value >= 0) -> .L55.
305 : | cmp4.le p6, p7 = r0, r14 | ||
306 : | (p6) br.cond.dptk .L55 | ||
// Negative value: m = -value - r18.
307 : | sub r14 = r0, r14 | ||
308 : | ;; | ||
309 : | sub r14 = r14, r18 | ||
310 : | ;; | ||
311 : | sxt2 r14 = r14 | ||
312 : | ;; | ||
// p6 = (m >= threshold): quantize; p7 = below threshold: store 0.
313 : | cmp4.le p6, p7 = r17, r14 | ||
314 : | ;; | ||
315 : | (p7) add r14 = r16, r32 | ||
316 : | (p6) setf.sig f7 = r14 | ||
317 : | ;; | ||
318 : | (p7) st2 [r14] = r0 | ||
319 : | (p6) add r16 = r16, r32 | ||
320 : | (p6) xma.l f7 = f7, f6, f0 | ||
321 : | ;; | ||
322 : | (p6) getf.sig r14 = f7 | ||
323 : | ;; | ||
324 : | (p6) extr r14 = r14, 16, 16 | ||
325 : | ;; | ||
// Store the negated quotient; add the positive quotient to the sum.
326 : | (p6) sub r15 = r0, r14 | ||
327 : | (p6) add r8 = r8, r14 | ||
328 : | ;; | ||
329 : | (p6) st2 [r16] = r15 | ||
330 : | br .L53 | ||
331 : | .L55: | ||
// Non-negative value: m = value - r18.
332 : | sub r14 = r14, r18 | ||
333 : | ;; | ||
334 : | sxt2 r14 = r14 | ||
335 : | ;; | ||
336 : | cmp4.le p6, p7 = r17, r14 | ||
337 : | ;; | ||
338 : | (p7) add r14 = r16, r32 | ||
339 : | (p6) add r15 = r16, r32 | ||
340 : | (p6) setf.sig f7 = r14 | ||
341 : | ;; | ||
342 : | (p7) st2 [r14] = r0 | ||
343 : | (p6) xma.l f7 = f7, f6, f0 | ||
344 : | ;; | ||
345 : | (p6) getf.sig r14 = f7 | ||
346 : | ;; | ||
347 : | (p6) extr r14 = r14, 16, 16 | ||
348 : | ;; | ||
349 : | (p6) st2 [r15] = r14 | ||
350 : | (p6) add r8 = r8, r14 | ||
351 : | .L53: | ||
// ---- Second element of the pair: index r19 + 1 ----
352 : | adds r14 = 1, r19 | ||
353 : | ;; | ||
354 : | dep.z r16 = r14, 1, 32 | ||
355 : | ;; | ||
356 : | add r15 = r16, r33 | ||
357 : | ;; | ||
358 : | ld2 r14 = [r15] | ||
359 : | ;; | ||
360 : | sxt2 r14 = r14 | ||
361 : | ;; | ||
362 : | cmp4.le p6, p7 = r0, r14 | ||
363 : | (p6) br.cond.dptk .L61 | ||
// Negative value: m = -value - r18.
364 : | sub r14 = r0, r14 | ||
365 : | ;; | ||
366 : | sub r14 = r14, r18 | ||
367 : | ;; | ||
368 : | sxt2 r14 = r14 | ||
369 : | ;; | ||
370 : | cmp4.le p6, p7 = r17, r14 | ||
371 : | ;; | ||
372 : | (p7) add r14 = r16, r32 | ||
373 : | (p6) setf.sig f7 = r14 | ||
374 : | ;; | ||
375 : | (p7) st2 [r14] = r0 | ||
376 : | (p6) add r16 = r16, r32 | ||
377 : | (p6) xma.l f7 = f7, f6, f0 | ||
378 : | ;; | ||
379 : | (p6) getf.sig r14 = f7 | ||
380 : | ;; | ||
381 : | (p6) extr r14 = r14, 16, 16 | ||
382 : | ;; | ||
383 : | (p6) sub r15 = r0, r14 | ||
384 : | (p6) add r8 = r8, r14 | ||
385 : | ;; | ||
386 : | (p6) st2 [r16] = r15 | ||
387 : | br .L59 | ||
388 : | .L61: | ||
// Non-negative value: m = value - r18.
389 : | sub r14 = r14, r18 | ||
390 : | ;; | ||
391 : | sxt2 r14 = r14 | ||
392 : | ;; | ||
393 : | cmp4.le p6, p7 = r17, r14 | ||
394 : | ;; | ||
395 : | (p7) add r14 = r16, r32 | ||
396 : | (p6) add r15 = r16, r32 | ||
397 : | (p6) setf.sig f7 = r14 | ||
398 : | ;; | ||
399 : | (p7) st2 [r14] = r0 | ||
400 : | (p6) xma.l f7 = f7, f6, f0 | ||
401 : | ;; | ||
402 : | (p6) getf.sig r14 = f7 | ||
403 : | ;; | ||
404 : | (p6) extr r14 = r14, 16, 16 | ||
405 : | ;; | ||
406 : | (p6) st2 [r15] = r14 | ||
407 : | (p6) add r8 = r8, r14 | ||
408 : | .L59: | ||
// Advance two elements; br.cloop repeats while ar.lc is non-zero.
409 : | adds r19 = 2, r19 | ||
410 : | br.cloop.sptk.few .L65 | ||
411 : | ;; | ||
// Restore the caller's ar.lc and return with the sum in r8.
412 : | mov ar.lc = r2 | ||
413 : | br.ret.sptk.many b0 | ||
414 : | .endp quant_inter_ia64# | ||
// Two 8-byte, 8-byte-aligned common symbols. None of the code visible in
// this listing references them.
// NOTE(review): presumably function-pointer globals from the C source - confirm.
415 : | .common quant_intra#,8,8 | ||
416 : | .common dequant_intra#,8,8 | ||
// dequant_intra_ia64
// Reads 64 signed halfwords through r33 and writes 64 halfwords through r32.
//   r32 = destination pointer, r33 = source pointer
//   r34 = scale input, r35 = multiplier for element 0 only
//   f6  = r34 * 2
//   f7  = r34 - (1 & ~r34), i.e. r34 when odd, r34 - 1 when even
// Element 0:     src[0] * r35, clamped to [-2048, 2047].
// Elements 1-63: 0 stays 0. Otherwise a = f6 * |src[i]| + f7;
//                negative inputs store -a (or -2048 when a > 2048),
//                positive inputs store a (or 2047 when a >= 2047).
// Leaf procedure: only ar.lc is preserved (in r2).
// NOTE(review): presumably the H.263 intra dequantizer with r34 as the
// quantizer and r35 as the DC scaler - confirm against quant_h263.c.
417 : | .align 16 | ||
418 : | .global dequant_intra_ia64# | ||
419 : | .proc dequant_intra_ia64# | ||
420 : | dequant_intra_ia64: | ||
421 : | .prologue | ||
// r14 = src[0]; r15 = 1 when r34 is even, else 0; f8 = r35.
422 : | ld2 r14 = [r33] | ||
423 : | andcm r15 = 1, r34 | ||
424 : | setf.sig f8 = r35 | ||
425 : | ;; | ||
426 : | sxt2 r14 = r14 | ||
427 : | sub r15 = r34, r15 | ||
428 : | addl r16 = -2048, r0 | ||
429 : | ;; | ||
430 : | setf.sig f6 = r14 | ||
431 : | setf.sig f7 = r15 | ||
// r34 = r34 * 2
432 : | shladd r34 = r34, 1, r0 | ||
433 : | ;; | ||
// f8 = src[0] * r35
434 : | xma.l f8 = f6, f8, f0 | ||
435 : | .save ar.lc, r2 | ||
436 : | mov r2 = ar.lc | ||
437 : | ;; | ||
438 : | .body | ||
439 : | getf.sig r14 = f8 | ||
440 : | setf.sig f6 = r34 | ||
441 : | ;; | ||
// Store the product first, then overwrite it if its 16-bit value is out of range.
442 : | sxt2 r15 = r14 | ||
443 : | st2 [r32] = r14 | ||
444 : | ;; | ||
// p7 = (value < -2048)
445 : | cmp4.le p6, p7 = r16, r15 | ||
446 : | ;; | ||
447 : | (p7) st2 [r32] = r16 | ||
448 : | (p7) br.cond.dptk .L68 | ||
449 : | addl r14 = 2047, r0 | ||
450 : | ;; | ||
// p7 = (value > 2047)
451 : | cmp4.ge p6, p7 = r14, r15 | ||
452 : | ;; | ||
453 : | (p7) st2 [r32] = r14 | ||
454 : | .L68: | ||
// ar.lc = 20 -> 21 trips of .L110, three elements per trip (indices 1..63).
// r19 = index, r21 = 2048, r20 = -2048, r18 = 2047.
455 : | addl r14 = 20, r0 | ||
456 : | addl r19 = 1, r0 | ||
457 : | addl r21 = 2048, r0 | ||
458 : | addl r20 = -2048, r0 | ||
459 : | addl r18 = 2047, r0 | ||
460 : | ;; | ||
461 : | mov ar.lc = r14 | ||
462 : | ;; | ||
463 : | .L110: | ||
// ---- First element of the triple: index r19, byte offset r16 ----
464 : | dep.z r16 = r19, 1, 32 | ||
465 : | ;; | ||
466 : | add r14 = r16, r33 | ||
467 : | ;; | ||
468 : | ld2 r15 = [r14] | ||
469 : | ;; | ||
470 : | sxt2 r15 = r15 | ||
471 : | ;; | ||
// p7 = (value == 0): store 0 and skip to the next element.
472 : | cmp4.ne p6, p7 = 0, r15 | ||
473 : | ;; | ||
474 : | (p7) add r14 = r16, r32 | ||
475 : | ;; | ||
476 : | (p7) st2 [r14] = r0 | ||
477 : | (p7) br.cond.dpnt .L92 | ||
478 : | cmp4.le p6, p7 = r0, r15 | ||
479 : | (p6) br.cond.dptk .L95 | ||
// Negative value: a = f6 * (-value) + f7.
480 : | sub r14 = r0, r15 | ||
481 : | add r17 = r16, r32 | ||
482 : | ;; | ||
483 : | setf.sig f8 = r14 | ||
484 : | ;; | ||
485 : | xma.l f8 = f6, f8, f7 | ||
486 : | ;; | ||
487 : | getf.sig r15 = f8 | ||
488 : | ;; | ||
// p6 = (a > 2048): store -2048; otherwise store -a.
489 : | cmp4.lt p6, p7 = r21, r15 | ||
490 : | ;; | ||
491 : | (p7) sub r14 = r0, r15 | ||
492 : | ;; | ||
493 : | (p7) st2 [r17] = r14 | ||
494 : | (p6) st2 [r17] = r20 | ||
495 : | br .L92 | ||
496 : | .L95: | ||
// Positive value: a = f6 * value + f7.
497 : | setf.sig f8 = r15 | ||
498 : | add r14 = r16, r32 | ||
499 : | ;; | ||
500 : | xma.l f8 = f6, f8, f7 | ||
501 : | ;; | ||
502 : | getf.sig r15 = f8 | ||
503 : | ;; | ||
// p6 = (a >= 2047): store 2047; otherwise r15 already holds a.
504 : | cmp4.le p6, p7 = r18, r15 | ||
505 : | ;; | ||
506 : | (p6) mov r15 = r18 | ||
507 : | ;; | ||
508 : | st2 [r14] = r15 | ||
509 : | .L92: | ||
// ---- Second element of the triple: index r19 + 1, byte offset r17 ----
510 : | adds r14 = 1, r19 | ||
511 : | ;; | ||
512 : | dep.z r17 = r14, 1, 32 | ||
513 : | ;; | ||
514 : | add r15 = r17, r33 | ||
515 : | ;; | ||
516 : | ld2 r14 = [r15] | ||
517 : | ;; | ||
518 : | sxt2 r14 = r14 | ||
519 : | ;; | ||
520 : | mov r16 = r14 | ||
521 : | ;; | ||
522 : | cmp4.ne p6, p7 = 0, r16 | ||
523 : | ;; | ||
524 : | (p7) add r14 = r17, r32 | ||
525 : | ;; | ||
526 : | (p7) st2 [r14] = r0 | ||
527 : | (p7) br.cond.dpnt .L98 | ||
528 : | cmp4.le p6, p7 = r0, r16 | ||
529 : | (p6) br.cond.dptk .L101 | ||
// Negative value.
530 : | sub r14 = r0, r16 | ||
531 : | add r17 = r17, r32 | ||
532 : | ;; | ||
533 : | setf.sig f8 = r14 | ||
534 : | ;; | ||
535 : | xma.l f8 = f6, f8, f7 | ||
536 : | ;; | ||
537 : | getf.sig r16 = f8 | ||
538 : | ;; | ||
539 : | cmp4.lt p6, p7 = r21, r16 | ||
540 : | ;; | ||
541 : | (p7) sub r14 = r0, r16 | ||
542 : | ;; | ||
543 : | (p7) st2 [r17] = r14 | ||
544 : | (p6) st2 [r17] = r20 | ||
545 : | br .L98 | ||
546 : | .L101: | ||
// Positive value; r15 is selected from 2047 (p6) or a (p7).
547 : | setf.sig f8 = r16 | ||
548 : | add r14 = r17, r32 | ||
549 : | ;; | ||
550 : | xma.l f8 = f6, f8, f7 | ||
551 : | ;; | ||
552 : | getf.sig r16 = f8 | ||
553 : | ;; | ||
554 : | cmp4.le p6, p7 = r18, r16 | ||
555 : | ;; | ||
556 : | (p6) mov r15 = r18 | ||
557 : | (p7) mov r15 = r16 | ||
558 : | ;; | ||
559 : | st2 [r14] = r15 | ||
560 : | .L98: | ||
// ---- Third element of the triple: index r19 + 2, byte offset r17 ----
561 : | adds r14 = 2, r19 | ||
562 : | ;; | ||
563 : | dep.z r17 = r14, 1, 32 | ||
564 : | ;; | ||
565 : | add r15 = r17, r33 | ||
566 : | ;; | ||
567 : | ld2 r14 = [r15] | ||
568 : | ;; | ||
569 : | sxt2 r14 = r14 | ||
570 : | ;; | ||
571 : | mov r16 = r14 | ||
572 : | ;; | ||
573 : | cmp4.ne p6, p7 = 0, r16 | ||
574 : | ;; | ||
575 : | (p7) add r14 = r17, r32 | ||
576 : | ;; | ||
577 : | (p7) st2 [r14] = r0 | ||
578 : | (p7) br.cond.dpnt .L104 | ||
579 : | cmp4.le p6, p7 = r0, r16 | ||
580 : | (p6) br.cond.dptk .L107 | ||
// Negative value.
581 : | sub r14 = r0, r16 | ||
582 : | add r17 = r17, r32 | ||
583 : | ;; | ||
584 : | setf.sig f8 = r14 | ||
585 : | ;; | ||
586 : | xma.l f8 = f6, f8, f7 | ||
587 : | ;; | ||
588 : | getf.sig r16 = f8 | ||
589 : | ;; | ||
590 : | cmp4.lt p6, p7 = r21, r16 | ||
591 : | ;; | ||
592 : | (p7) sub r14 = r0, r16 | ||
593 : | ;; | ||
594 : | (p7) st2 [r17] = r14 | ||
595 : | (p6) st2 [r17] = r20 | ||
596 : | br .L104 | ||
597 : | .L107: | ||
// Positive value.
598 : | setf.sig f8 = r16 | ||
599 : | add r14 = r17, r32 | ||
600 : | ;; | ||
601 : | xma.l f8 = f6, f8, f7 | ||
602 : | ;; | ||
603 : | getf.sig r16 = f8 | ||
604 : | ;; | ||
605 : | cmp4.le p6, p7 = r18, r16 | ||
606 : | ;; | ||
607 : | (p6) mov r15 = r18 | ||
608 : | (p7) mov r15 = r16 | ||
609 : | ;; | ||
610 : | st2 [r14] = r15 | ||
611 : | .L104: | ||
// Advance three elements; br.cloop repeats while ar.lc is non-zero.
612 : | adds r19 = 3, r19 | ||
613 : | br.cloop.sptk.few .L110 | ||
614 : | ;; | ||
// Restore the caller's ar.lc and return.
615 : | mov ar.lc = r2 | ||
616 : | br.ret.sptk.many b0 | ||
617 : | .endp dequant_intra_ia64# | ||
// Two 8-byte, 8-byte-aligned common symbols. None of the code visible in
// this listing references them.
// NOTE(review): presumably function-pointer globals from the C source - confirm.
618 : | .common quant_inter#,8,8 | ||
619 : | .common dequant_inter#,8,8 | ||
// dequant_inter_ia64
// Reads 64 signed halfwords through r33 and writes 64 halfwords through r32.
//   r32 = destination pointer, r33 = source pointer, r34 = scale input
//   f6  = (low 15 bits of r34) << 1
//   r34 is rewritten to the low 16 bits of r34 - (1 & ~r34), i.e. r34 when
//       odd and r34 - 1 when even; it is used as the additive term.
// Per element: 0 stays 0. Negative inputs give sxt2(value * f6 - r34),
// raised to -2048 if smaller; positive inputs give sxt2(value * f6 + r34),
// replaced by 2047 if >= 2047.
// Leaf procedure: only ar.lc is preserved (in r2).
// NOTE(review): presumably the H.263 inter dequantizer with r34 as the
// quantizer - confirm against quant_h263.c.
620 : | .align 16 | ||
621 : | .global dequant_inter_ia64# | ||
622 : | .proc dequant_inter_ia64# | ||
623 : | dequant_inter_ia64: | ||
624 : | .prologue | ||
// r14 = 1 when r34 is even, else 0; r15 = doubled scale.
625 : | andcm r14 = 1, r34 | ||
626 : | dep.z r15 = r34, 1, 15 | ||
627 : | .save ar.lc, r2 | ||
628 : | mov r2 = ar.lc | ||
629 : | ;; | ||
630 : | .body | ||
631 : | sub r34 = r34, r14 | ||
632 : | setf.sig f6 = r15 | ||
// r19 = index 0; ar.lc = 31 -> 32 trips of .L122, two elements per trip.
// r18 = -2048 and r17 = 2047 are the clamp bounds.
633 : | mov r19 = r0 | ||
634 : | addl r14 = 31, r0 | ||
635 : | addl r18 = -2048, r0 | ||
636 : | addl r17 = 2047, r0 | ||
637 : | ;; | ||
638 : | zxt2 r34 = r34 | ||
639 : | mov ar.lc = r14 | ||
640 : | ;; | ||
641 : | .L122: | ||
// ---- First element of the pair: index r19, byte offset r16 ----
642 : | dep.z r16 = r19, 1, 32 | ||
643 : | ;; | ||
644 : | add r14 = r16, r33 | ||
645 : | ;; | ||
646 : | ld2 r15 = [r14] | ||
647 : | ;; | ||
648 : | sxt2 r15 = r15 | ||
649 : | ;; | ||
650 : | mov r14 = r15 | ||
651 : | ;; | ||
// p7 = (value == 0): store 0 and skip to the next element.
652 : | cmp4.ne p6, p7 = 0, r14 | ||
653 : | ;; | ||
654 : | (p7) add r14 = r16, r32 | ||
655 : | ;; | ||
656 : | (p7) st2 [r14] = r0 | ||
657 : | (p7) br.cond.dpnt .L112 | ||
658 : | cmp4.le p6, p7 = r0, r14 | ||
659 : | (p6) br.cond.dptk .L115 | ||
// Negative value: r14 = sxt2(value * f6 - r34).
660 : | setf.sig f7 = r14 | ||
661 : | add r15 = r16, r32 | ||
662 : | ;; | ||
663 : | xma.l f7 = f7, f6, f0 | ||
664 : | ;; | ||
665 : | getf.sig r14 = f7 | ||
666 : | ;; | ||
667 : | sub r14 = r14, r34 | ||
668 : | ;; | ||
669 : | sxt2 r14 = r14 | ||
670 : | ;; | ||
// p7 = (result < -2048): clamp to -2048.
671 : | cmp4.le p6, p7 = r18, r14 | ||
672 : | ;; | ||
673 : | (p7) mov r14 = r18 | ||
674 : | br .L123 | ||
675 : | .L115: | ||
// Positive value (still in r15): r14 = sxt2(value * f6 + r34).
676 : | setf.sig f8 = r15 | ||
677 : | setf.sig f7 = r34 | ||
678 : | ;; | ||
679 : | xma.l f8 = f8, f6, f7 | ||
680 : | add r15 = r16, r32 | ||
681 : | ;; | ||
682 : | getf.sig r14 = f8 | ||
683 : | ;; | ||
684 : | sxt2 r14 = r14 | ||
685 : | ;; | ||
// p6 = (result >= 2047): clamp to 2047.
686 : | cmp4.le p6, p7 = r17, r14 | ||
687 : | ;; | ||
688 : | (p6) mov r14 = r17 | ||
689 : | ;; | ||
690 : | .L123: | ||
691 : | st2 [r15] = r14 | ||
692 : | .L112: | ||
// ---- Second element of the pair: index r19 + 1 ----
693 : | adds r14 = 1, r19 | ||
694 : | ;; | ||
695 : | dep.z r16 = r14, 1, 32 | ||
696 : | ;; | ||
697 : | add r15 = r16, r33 | ||
698 : | ;; | ||
699 : | ld2 r14 = [r15] | ||
700 : | ;; | ||
701 : | sxt2 r14 = r14 | ||
702 : | ;; | ||
703 : | mov r15 = r14 | ||
704 : | ;; | ||
705 : | cmp4.ne p6, p7 = 0, r15 | ||
706 : | ;; | ||
707 : | (p7) add r14 = r16, r32 | ||
708 : | ;; | ||
709 : | (p7) st2 [r14] = r0 | ||
710 : | (p7) br.cond.dpnt .L117 | ||
711 : | cmp4.le p6, p7 = r0, r15 | ||
712 : | (p6) br.cond.dptk .L120 | ||
// Negative value: r14 = sxt2(value * f6 - r34), raised to -2048 if smaller.
713 : | setf.sig f8 = r15 | ||
714 : | ;; | ||
715 : | xma.l f8 = f8, f6, f0 | ||
716 : | add r15 = r16, r32 | ||
717 : | ;; | ||
718 : | getf.sig r14 = f8 | ||
719 : | ;; | ||
720 : | sub r14 = r14, r34 | ||
721 : | ;; | ||
722 : | sxt2 r14 = r14 | ||
723 : | ;; | ||
724 : | cmp4.le p6, p7 = r18, r14 | ||
725 : | ;; | ||
726 : | (p7) mov r14 = r18 | ||
727 : | br .L124 | ||
728 : | ;; | ||
729 : | .L120: | ||
// Positive value (r14 still holds it): r14 = sxt2(value * f6 + r34),
// replaced by 2047 if >= 2047.
730 : | setf.sig f7 = r14 | ||
731 : | setf.sig f8 = r34 | ||
732 : | add r15 = r16, r32 | ||
733 : | ;; | ||
734 : | xma.l f7 = f7, f6, f8 | ||
735 : | ;; | ||
736 : | getf.sig r14 = f7 | ||
737 : | ;; | ||
738 : | sxt2 r14 = r14 | ||
739 : | ;; | ||
740 : | cmp4.le p6, p7 = r17, r14 | ||
741 : | ;; | ||
742 : | (p6) mov r14 = r17 | ||
743 : | ;; | ||
744 : | .L124: | ||
745 : | st2 [r15] = r14 | ||
746 : | .L117: | ||
// Advance two elements; br.cloop repeats while ar.lc is non-zero.
747 : | adds r19 = 2, r19 | ||
748 : | br.cloop.sptk.few .L122 | ||
749 : | ;; | ||
// Restore the caller's ar.lc and return.
750 : | mov ar.lc = r2 | ||
751 : | br.ret.sptk.many b0 | ||
752 : | .endp dequant_inter_ia64# | ||
// Compiler identification string emitted by GCC.
753 : | .ident "GCC: (GNU) 2.96 20000731 (Red Hat Linux 7.1 2.96-85)" |
No admin address has been configured | ViewVC Help |
Powered by ViewVC 1.0.4 |