|
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210 |
-
-
- #if defined(__MK20DX128__) || defined(__MK20DX256__) || defined(__MK64FX512__) || defined(__MK66FX1M0__)
-
- .cpu cortex-m4
- .syntax unified
- .thumb
- .text
- .align 2
-
-
- // ---------------------------------------------------------------------------
- // memcpy_tointerleaveLR
- //   Merges two streams of 16-bit samples into one interleaved stream.
- //   C view (inferred from register usage, confirm against the C prototype):
- //     void memcpy_tointerleaveLR(int16_t *dst, const int16_t *srcL,
- //                                const int16_t *srcR);
- //   In:     r0 = destination, r1 = first source, r2 = second source.
- //           All three are accessed with LDM/STM and must be word aligned.
- //   Out:    every destination word holds the sample from r1 in its low
- //           halfword and the matching sample from r2 in its high halfword.
- //   Size:   AUDIO_BLOCK_SAMPLES*2 bytes are written, i.e.
- //           AUDIO_BLOCK_SAMPLES/2 samples are consumed from each source.
- //   Clobb:  r0-r3, r12, flags. r4-r11 are saved and restored.
- // ---------------------------------------------------------------------------
- #ifndef AUDIO_BLOCK_SAMPLES
- // Fallback for builds that do not pass the block length to the assembler;
- // it reproduces the previously hard-coded size of 256 bytes.
- #define AUDIO_BLOCK_SAMPLES 128
- #endif
-
- // The loop exits on pointer equality only, so the byte count has to be a
- // non-zero multiple of the 64 bytes stored per pass.
- .if (AUDIO_BLOCK_SAMPLES == 0) || ((AUDIO_BLOCK_SAMPLES*2) & 63)
- .error "memcpy_tointerleaveLR: AUDIO_BLOCK_SAMPLES*2 must be a non-zero multiple of 64"
- .endif
-
- .global memcpy_tointerleaveLR
- .thumb_func
- memcpy_tointerleaveLR:
- push {r4-r11,lr} // lr is needed as a scratch register below
- add lr, r0, #(AUDIO_BLOCK_SAMPLES*2) // lr = first byte past the destination
- .align 2
- .LloopLR:
-
- .rept 2 // unrolled twice: 2 * 32 bytes stored per loop pass
-
- // Load 4 words (8 samples) from each source
- ldmia r1!, {r5,r7,r9,r11} //1+4
- ldmia r2!, {r6,r8,r10,r12} //1+4
-
- // Even sample pair: low halves of both inputs -> first[n] | second[n] << 16
- // Odd sample pair: high halves of both inputs -> first[n+1] | second[n+1] << 16
- // Each result register is only overwritten after its old value was consumed.
- pkhbt r3,r5,r6,LSL #16 //1
- pkhtb r4,r6,r5,ASR #16 //1
-
- pkhbt r5,r7,r8,LSL #16 //1
- pkhtb r6,r8,r7,ASR #16 //1
-
- pkhbt r7,r9,r10,LSL #16 //1
- pkhtb r8,r10,r9,ASR #16 //1
-
- pkhbt r9,r11,r12,LSL #16 //1
- pkhtb r10,r12,r11,ASR #16 //1
-
- // Store 8 interleaved words
- stmia r0!, {r3-r10} //1+8
-
- .endr //5+5+8+9 = 27 cycles to interleave 32 bytes.
-
- cmp lr, r0
- bne .LloopLR
-
- pop {r4-r11,pc} // restore and return in one instruction
-
-
-
- // ---------------------------------------------------------------------------
- // memcpy_tointerleaveL
- //   Expands one stream of 16-bit samples into an interleaved stream whose
- //   other channel is zero.
- //   C view (inferred from register usage, confirm against the C prototype):
- //     void memcpy_tointerleaveL(int16_t *dst, const int16_t *src);
- //   In:     r0 = destination, r1 = source; both are accessed with LDM/STM
- //           and must be word aligned.
- //   Out:    every destination word holds one source sample in its low
- //           halfword and zero in its high halfword.
- //   Size:   AUDIO_BLOCK_SAMPLES*2 bytes are written, i.e.
- //           AUDIO_BLOCK_SAMPLES/2 samples are consumed from the source.
- //   Clobb:  r0-r3, r12, flags. r4-r11 are saved and restored.
- // ---------------------------------------------------------------------------
- #ifndef AUDIO_BLOCK_SAMPLES
- // Fallback for builds that do not pass the block length to the assembler;
- // it reproduces the previously hard-coded size of 256 bytes.
- #define AUDIO_BLOCK_SAMPLES 128
- #endif
-
- // The loop exits on pointer equality only, so the byte count has to be a
- // non-zero multiple of the 64 bytes stored per pass.
- .if (AUDIO_BLOCK_SAMPLES == 0) || ((AUDIO_BLOCK_SAMPLES*2) & 63)
- .error "memcpy_tointerleaveL: AUDIO_BLOCK_SAMPLES*2 must be a non-zero multiple of 64"
- .endif
-
- .global memcpy_tointerleaveL
- .thumb_func
- memcpy_tointerleaveL:
- push {r4-r11}
- mov r2, #0 // r2 = constant zero, supplies the empty halfword
- add r12, r0, #(AUDIO_BLOCK_SAMPLES*2) // r12 = first byte past the destination
- .align 2
- .LloopL:
-
- .rept 2 // unrolled twice: 2 * 32 bytes stored per loop pass
-
- // Load 4 words (8 samples)
- ldmia r1!, {r5,r7,r9,r11} //1+4
-
- // pkhbt keeps the low sample in place and takes the zero top half of r2;
- // pkhtb moves the high sample down (ASR #16) under the zero top half of r2.
- // Each result register is only overwritten after its old value was consumed.
- pkhbt r3,r5,r2 //1
- pkhtb r4,r2,r5,ASR #16 //1
-
- pkhbt r5,r7,r2 //1
- pkhtb r6,r2,r7,ASR #16 //1
-
- pkhbt r7,r9,r2 //1
- pkhtb r8,r2,r9,ASR #16 //1
-
- pkhbt r9,r11,r2 //1
- pkhtb r10,r2,r11,ASR #16 //1
-
- // Store 8 words, one sample per word
- stmia r0!, {r3-r10} //1+8
-
- .endr
-
- cmp r12, r0
- bne .LloopL
-
- pop {r4-r11}
- bx lr
-
-
- // ---------------------------------------------------------------------------
- // memcpy_tointerleaveR
- //   Expands one stream of 16-bit samples into an interleaved stream whose
- //   other channel is zero.
- //   C view (inferred from register usage, confirm against the C prototype):
- //     void memcpy_tointerleaveR(int16_t *dst, const int16_t *src);
- //   In:     r0 = destination, r1 = source; both are accessed with LDM/STM
- //           and must be word aligned.
- //   Out:    every destination word holds zero in its low halfword and one
- //           source sample in its high halfword.
- //   Size:   AUDIO_BLOCK_SAMPLES*2 bytes are written, i.e.
- //           AUDIO_BLOCK_SAMPLES/2 samples are consumed from the source.
- //   Clobb:  r0-r3, r12, flags. r4-r11 are saved and restored.
- // ---------------------------------------------------------------------------
- #ifndef AUDIO_BLOCK_SAMPLES
- // Fallback for builds that do not pass the block length to the assembler;
- // it reproduces the previously hard-coded size of 256 bytes.
- #define AUDIO_BLOCK_SAMPLES 128
- #endif
-
- // The loop exits on pointer equality only, so the byte count has to be a
- // non-zero multiple of the 64 bytes stored per pass.
- .if (AUDIO_BLOCK_SAMPLES == 0) || ((AUDIO_BLOCK_SAMPLES*2) & 63)
- .error "memcpy_tointerleaveR: AUDIO_BLOCK_SAMPLES*2 must be a non-zero multiple of 64"
- .endif
-
- .global memcpy_tointerleaveR
- .thumb_func
- memcpy_tointerleaveR:
- push {r4-r11}
- mov r2, #0 // r2 = constant zero, supplies the empty halfword
- add r12, r0, #(AUDIO_BLOCK_SAMPLES*2) // r12 = first byte past the destination
- .align 2
- .LloopR:
-
- .rept 2 // unrolled twice: 2 * 32 bytes stored per loop pass
-
- // Load 4 words (8 samples)
- ldmia r1!, {r5,r7,r9,r11}
-
- // pkhbt moves the low sample up (LSL #16) above the zero low half of r2;
- // pkhtb keeps the high sample in place above the zero low half of r2.
- // Each result register is only overwritten after its old value was consumed.
- pkhbt r3,r2,r5,LSL #16
- pkhtb r4,r5,r2
-
- pkhbt r5,r2,r7,LSL #16
- pkhtb r6,r7,r2
-
- pkhbt r7,r2,r9,LSL #16
- pkhtb r8,r9,r2
-
- pkhbt r9,r2,r11,LSL #16
- pkhtb r10,r11,r2
-
- // Store 8 words, one sample per word
- stmia r0!, {r3-r10}
-
- .endr
-
- cmp r12, r0
- bne .LloopR
-
- pop {r4-r11}
- bx lr
-
-
-
-
- // ---------------------------------------------------------------------------
- // memcpy_tointerleaveQuad
- //   Merges four streams of 16-bit samples into one interleaved stream.
- //   C view (inferred from register usage, confirm against the C prototype):
- //     void memcpy_tointerleaveQuad(int16_t *dst, const int16_t *src1,
- //                                  const int16_t *src2, const int16_t *src3,
- //                                  const int16_t *src4);
- //   In:     r0 = destination (written with STM, must be word aligned),
- //           r1, r2, r3 = sources 1 to 3, source 4 = fifth argument, passed
- //           on the stack.
- //   Out:    for each sample index the destination receives two words:
- //           first  = src1 sample (low halfword) | src3 sample (high halfword)
- //           second = src2 sample (low halfword) | src4 sample (high halfword)
- //   Size:   AUDIO_BLOCK_SAMPLES*4 bytes are written, i.e.
- //           AUDIO_BLOCK_SAMPLES/2 samples are consumed from each source.
- //   Clobb:  r0-r3, flags. r4-r11 are saved and restored.
- // ---------------------------------------------------------------------------
- #ifndef AUDIO_BLOCK_SAMPLES
- // Fallback for builds that do not pass the block length to the assembler;
- // it reproduces the previously hard-coded size of 512 bytes.
- #define AUDIO_BLOCK_SAMPLES 128
- #endif
-
- // The loop exits on pointer equality only, so the byte count has to be a
- // non-zero multiple of the 32 bytes stored per pass.
- .if (AUDIO_BLOCK_SAMPLES == 0) || ((AUDIO_BLOCK_SAMPLES*4) & 31)
- .error "memcpy_tointerleaveQuad: AUDIO_BLOCK_SAMPLES*4 must be a non-zero multiple of 32"
- .endif
-
- .global memcpy_tointerleaveQuad
- .thumb_func
- memcpy_tointerleaveQuad:
- push {r4-r11}
- ldr r4, [sp, #(0+32)] // fifth argument sits above the 8 registers just pushed
- add r11, r0, #(AUDIO_BLOCK_SAMPLES*4) // r11 = first byte past the destination
- .align 2
- .LloopQuad:
-
- .rept 2 // unrolled twice: 2 * 16 bytes stored per loop pass
-
- // One word (2 samples) from source 1 and source 3
- ldr r5, [r1], #4
- ldr r6, [r3], #4
- pkhbt r7,r5,r6,LSL #16 // r7 = src1[n] | src3[n] << 16
- pkhtb r9,r6,r5,ASR #16 // r9 = src1[n+1] | src3[n+1] << 16
-
- // One word (2 samples) from source 2 and source 4
- ldr r5, [r2], #4
- ldr r6, [r4], #4
- pkhbt r8,r5,r6,LSL #16 // r8 = src2[n] | src4[n] << 16
- pkhtb r10,r6,r5,ASR #16 // r10 = src2[n+1] | src4[n+1] << 16
-
- // Stored in register order r7, r8, r9, r10
- stmia r0!, {r7-r10}
-
- .endr
-
- cmp r11, r0
- bne .LloopQuad
-
- pop {r4-r11}
-
- bx lr
-
-
- .END
-
- #endif
|