project:cfg:BoardConfig_IPC: Added fastboot BoardConfig file and firmware post-scripts, distinguishing between the BoardConfigs for Luckfox Pico Pro and Luckfox Pico Max. project:app: Added fastboot_client and rk_smart_door for quick boot applications; updated rkipc app to adapt to the latest media library. media:samples: Added more usage examples. media:rockit: Fixed bugs; removed support for retrieving data frames from VPSS. media:isp: Updated rkaiq library and related tools to support connection to RKISP_Tuner. sysdrv:Makefile: Added support for compiling drv_ko on Luckfox Pico Ultra W using Ubuntu; added support for custom root filesystem. sysdrv:tools:board: Updated Buildroot optional mirror sources, updated some software versions, and stored device tree files and configuration files that undergo multiple modifications for U-Boot and kernel separately. sysdrv:source:mcu: Used RISC-V MCU SDK with RT-Thread system, mainly for initializing camera AE during quick boot. sysdrv:source:uboot: Added support for fastboot; added high baud rate DDR bin for serial firmware upgrades. sysdrv:source:kernel: Upgraded to version 5.10.160; increased NPU frequency for RV1106G3; added support for fastboot. Signed-off-by: luckfox-eng29 <eng29@luckfox.com>
186 lines
5.4 KiB
ArmAsm
186 lines
5.4 KiB
ArmAsm
/*
|
|
* Copyright © 2016 Siarhei Siamashka <siarhei.siamashka@gmail.com>
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice (including the next
|
|
* paragraph) shall be included in all copies or substantial portions of the
|
|
* Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
* DEALINGS IN THE SOFTWARE.
|
|
*/
|
|
|
|
#ifdef __aarch64__
|
|
|
|
.cpu cortex-a53+fp+simd
|
|
.text
|
|
.align 2
|
|
|
|
#define PREFETCH_DISTANCE 320
|
|
|
|
.macro asm_function function_name
|
|
.global \function_name
|
|
.type \function_name,%function
|
|
.func \function_name
|
|
\function_name:
|
|
DST .req x0
|
|
SRC .req x1
|
|
SIZE .req x2
|
|
.endm
|
|
|
|
asm_function aligned_block_copy_ldpstp_x_aarch64
|
|
0:
|
|
ldp x3, x4, [SRC, #(0 * 16)]
|
|
ldp x5, x6, [SRC, #(1 * 16)]
|
|
ldp x7, x8, [SRC, #(2 * 16)]
|
|
ldp x9, x10, [SRC, #(3 * 16)]
|
|
add SRC, SRC, #64
|
|
stp x3, x4, [DST, #(0 * 16)]
|
|
stp x5, x6, [DST, #(1 * 16)]
|
|
stp x7, x8, [DST, #(2 * 16)]
|
|
stp x9, x10, [DST, #(3 * 16)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_copy_ldpstp_q_aarch64
|
|
0:
|
|
ldp q0, q1, [SRC, #(0 * 32)]
|
|
ldp q2, q3, [SRC, #(1 * 32)]
|
|
add SRC, SRC, #64
|
|
stp q0, q1, [DST, #(0 * 32)]
|
|
stp q2, q3, [DST, #(1 * 32)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_copy_ldpstp_q_pf32_l2strm_aarch64
|
|
0:
|
|
prfm pldl2strm, [SRC, #(PREFETCH_DISTANCE + 0)]
|
|
ldp q0, q1, [SRC, #(0 * 32)]
|
|
prfm pldl2strm, [SRC, #(PREFETCH_DISTANCE + 32)]
|
|
ldp q2, q3, [SRC, #(1 * 32)]
|
|
add SRC, SRC, #64
|
|
stp q0, q1, [DST, #(0 * 32)]
|
|
stp q2, q3, [DST, #(1 * 32)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_copy_ldpstp_q_pf64_l2strm_aarch64
|
|
0:
|
|
prfm pldl2strm, [SRC, #(PREFETCH_DISTANCE)]
|
|
ldp q0, q1, [SRC, #(0 * 32)]
|
|
ldp q2, q3, [SRC, #(1 * 32)]
|
|
add SRC, SRC, #64
|
|
stp q0, q1, [DST, #(0 * 32)]
|
|
stp q2, q3, [DST, #(1 * 32)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_copy_ldpstp_q_pf32_l1keep_aarch64
|
|
0:
|
|
prfm pldl1keep, [SRC, #(PREFETCH_DISTANCE + 0)]
|
|
ldp q0, q1, [SRC, #(0 * 32)]
|
|
prfm pldl1keep, [SRC, #(PREFETCH_DISTANCE + 32)]
|
|
ldp q2, q3, [SRC, #(1 * 32)]
|
|
add SRC, SRC, #64
|
|
stp q0, q1, [DST, #(0 * 32)]
|
|
stp q2, q3, [DST, #(1 * 32)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_copy_ldpstp_q_pf64_l1keep_aarch64
|
|
0:
|
|
prfm pldl1keep, [SRC, #(PREFETCH_DISTANCE)]
|
|
ldp q0, q1, [SRC, #(0 * 32)]
|
|
ldp q2, q3, [SRC, #(1 * 32)]
|
|
add SRC, SRC, #64
|
|
stp q0, q1, [DST, #(0 * 32)]
|
|
stp q2, q3, [DST, #(1 * 32)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_fill_stp_x_aarch64
|
|
0:
|
|
stp x3, x4, [DST, #(0 * 16)]
|
|
stp x5, x6, [DST, #(1 * 16)]
|
|
stp x7, x8, [DST, #(2 * 16)]
|
|
stp x9, x10, [DST, #(3 * 16)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_fill_stp_q_aarch64
|
|
0:
|
|
stp q0, q1, [DST, #(0 * 32)]
|
|
stp q2, q3, [DST, #(1 * 32)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_fill_stnp_x_aarch64
|
|
0:
|
|
stnp x3, x4, [DST, #(0 * 16)]
|
|
stnp x5, x6, [DST, #(1 * 16)]
|
|
stnp x7, x8, [DST, #(2 * 16)]
|
|
stnp x9, x10, [DST, #(3 * 16)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_fill_stnp_q_aarch64
|
|
0:
|
|
stnp q0, q1, [DST, #(0 * 32)]
|
|
stnp q2, q3, [DST, #(1 * 32)]
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
asm_function aligned_block_copy_ld1st1_aarch64
|
|
0:
|
|
ld1 {v0.16b, v1.16b, v2.16b, v3.16b}, [SRC]
|
|
st1 {v0.16b, v1.16b, v2.16b, v3.16b}, [DST]
|
|
add SRC, SRC, #64
|
|
add DST, DST, #64
|
|
subs SIZE, SIZE, #64
|
|
bgt 0b
|
|
ret
|
|
.endfunc
|
|
|
|
#endif
|