tests: add armv7 debug test and a register dumper
[pandora-misc.git] / tests / neoncpy.S
/*
 * NEON block-copy routine. GNU as syntax; register usage follows the AAPCS
 * convention of preserving r4-r11 across the call.
 */
        .fpu    neon
        .text

/*
 * memcpy_neon - copy memory in 128-byte blocks using NEON and core registers.
 *
 * NOTE(review): presumably called from C as
 *     void *memcpy_neon(void *dst, const void *src, size_t n);
 * confirm against the callers.
 *
 * In:    r0 = destination address
 *        r1 = source address
 *        r2 = byte count
 * Out:   r0 = destination address (r0 is never written here)
 * Clobb: r1, r2, r3, d0-d7, d16-d19, flags
 *        (r4-r11 are used as data registers but saved and restored)
 * Stack: 32 bytes while the copy is running
 *
 * Constraints that follow from the code below:
 *   - source and destination must both be 16-byte aligned, because every
 *     NEON access carries a :128 alignment qualifier;
 *   - data always moves in whole 128-byte blocks, so a count that is not a
 *     multiple of 128 is rounded up to the next multiple;
 *   - the loop test is signed (bgt), so a count of 2 GiB or more stops
 *     after a single block.
 *
 * A count of zero returns immediately without touching memory.
 */
        .global memcpy_neon
        .type   memcpy_neon, %function
        .func   memcpy_neon
memcpy_neon:
        cmp             r2, #0
        beq             2f                      @ nothing to copy, leave memory alone

        push            {r4-r11}                @ r4-r11 carry the last 32 bytes of each block
        mov             r3, r0                  @ r3 = write cursor, r0 stays as return value

        @ Loop invariant: r1/r3 = next source/destination byte, both advanced
        @ by 128 per pass; r2 = bytes still to copy, decremented mid-pass.
1:      pld             [r1, #192]              @ prefetch hints ahead of the read cursor
        pld             [r1, #256]
        vld1.64         {d0-d3},   [r1,:128]!   @ bytes   0..31
        vld1.64         {d4-d7},   [r1,:128]!   @ bytes  32..63
        vld1.64         {d16-d19}, [r1,:128]!   @ bytes  64..95
        ldm             r1!, {r4-r11}           @ bytes  96..127
        subs            r2, r2, #128            @ sets the flags consumed by bgt below;
                                                @ the stores in between leave flags alone
        vst1.64         {d0-d3},   [r3,:128]!
        vst1.64         {d4-d7},   [r3,:128]!
        vst1.64         {d16-d19}, [r3,:128]!
        stm             r3!, {r4-r11}
        bgt             1b                      @ more than one block was left: go again

        pop             {r4-r11}
2:      bx              lr
        .size   memcpy_neon, . - memcpy_neon
        .endfunc