mirror of
				https://github.com/nyanmisaka/ffmpeg-rockchip.git
				synced 2025-10-31 20:42:49 +08:00 
			
		
		
		
	lavc/aacpsdsp: unroll RISC-V V add_squares
This slightly improves performance with the Device Under Test by processing each loop iteration with a vector register group multiplier (LMUL) of 4 instead of 1.
This commit is contained in:
		| @@ -22,13 +22,13 @@ | |||||||
|  |  | ||||||
| func ff_ps_add_squares_rvv, zve32f | func ff_ps_add_squares_rvv, zve32f | ||||||
| 1: | 1: | ||||||
|         vsetvli     t0, a2, e32, m1, ta, ma |         vsetvli     t0, a2, e32, m4, ta, ma | ||||||
|         vlseg2e32.v v24, (a1) |         vlseg2e32.v v24, (a1) | ||||||
|         sub         a2, a2, t0 |         sub         a2, a2, t0 | ||||||
|         vle32.v     v16, (a0) |         vle32.v     v16, (a0) | ||||||
|         sh3add      a1, t0, a1 |         sh3add      a1, t0, a1 | ||||||
|         vfmacc.vv   v16, v24, v24 |         vfmacc.vv   v16, v24, v24 | ||||||
|         vfmacc.vv   v16, v25, v25 |         vfmacc.vv   v16, v28, v28 | ||||||
|         vse32.v     v16, (a0) |         vse32.v     v16, (a0) | ||||||
|         sh2add      a0, t0, a0 |         sh2add      a0, t0, a0 | ||||||
|         bnez        a2, 1b |         bnez        a2, 1b | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Rémi Denis-Courmont
					Rémi Denis-Courmont