Browse Source

!10514 [MSLITE][DEVELOP] fix bug of arm cpu fp32 op: deconv depthwise

From: @yangruoqi713
Reviewed-by: @zhanghaibo5,@zhang_xue_tong
Signed-off-by: @zhang_xue_tong
tags/v1.2.0-rc1
mindspore-ci-bot Gitee 5 years ago
parent
commit
8d3e09cfe3
1 changed files with 5 additions and 0 deletions
  1. +5
    -0
      mindspore/lite/nnacl/assembly/arm64/DeconvDwFp32Border.S

+ 5
- 0
mindspore/lite/nnacl/assembly/arm64/DeconvDwFp32Border.S View File

@@ -16,6 +16,10 @@ DeconvDwFp32Border:
// https://github.com/ARM-software/abi-aa/blob/master/aapcs64/aapcs64.rst#simd-and-floating-point-registers
// x19 ~ x29 should also be preserved
// whereas our coding style does not permit such a number of parameters
cmp x3, #0
beq End
cmp x4, #0
beq End
ld1 {v1.4s}, [x1]

mov x13, x0
@@ -35,5 +39,6 @@ DeconvDwFp32Border:
add x13, x13, x5
add x14, x14, x7
bne LoopH
End:
ret
#endif

Loading…
Cancel
Save