|
717 | 717 |
|
718 | 718 | #define MULADDC_X1_CORE \
|
719 | 719 | ".p2align 2 \n\t" \
|
720 |
| - "ldr.w %[a], [%[in]], #4 \n\t" \ |
721 |
| - "ldr.w %[b], [%[acc]] \n\t" \ |
| 720 | + "ldr %[a], [%[in]], #4 \n\t" \ |
| 721 | + "ldr %[b], [%[acc]] \n\t" \ |
722 | 722 | "umaal %[b], %[carry], %[scalar], %[a] \n\t" \
|
723 |
| - "str.w %[b], [%[acc]], #4 \n\t" |
| 723 | + "str %[b], [%[acc]], #4 \n\t" |
724 | 724 |
|
725 | 725 | #define MULADDC_X1_STOP \
|
726 | 726 | : [a] "=&r" (tmp_a), \
|
|
751 | 751 | * 2 cycles, while subsequent loads/stores are single-cycle. */
|
752 | 752 | #define MULADDC_X2_CORE \
|
753 | 753 | ".p2align 2 \n\t" \
|
754 |
| - "ldr.w %[a0], [%[in]], #+8 \n\t" \ |
755 |
| - "ldr.w %[b0], [%[acc]], #+8 \n\t" \ |
756 |
| - "ldr.w %[a1], [%[in], #-4] \n\t" \ |
757 |
| - "ldr.w %[b1], [%[acc], #-4] \n\t" \ |
| 754 | + "ldr %[a0], [%[in]], #+8 \n\t" \ |
| 755 | + "ldr %[b0], [%[acc]], #+8 \n\t" \ |
| 756 | + "ldr %[a1], [%[in], #-4] \n\t" \ |
| 757 | + "ldr %[b1], [%[acc], #-4] \n\t" \ |
758 | 758 | "umaal %[b0], %[carry], %[scalar], %[a0] \n\t" \
|
759 | 759 | "umaal %[b1], %[carry], %[scalar], %[a1] \n\t" \
|
760 |
| - "str.w %[b0], [%[acc], #-8] \n\t" \ |
761 |
| - "str.w %[b1], [%[acc], #-4] \n\t" |
| 760 | + "str %[b0], [%[acc], #-8] \n\t" \ |
| 761 | + "str %[b1], [%[acc], #-4] \n\t" |
762 | 762 |
|
763 | 763 | #define MULADDC_X2_STOP \
|
764 | 764 | : [a0] "=&r" (tmp_a0), \
|
|
0 commit comments