mirror of
				https://github.com/nyanmisaka/ffmpeg-rockchip.git
				synced 2025-10-26 10:20:52 +08:00 
			
		
		
		
	 d2ae5f77c6
			
		
	
	d2ae5f77c6
	
	
	
		
			
			Performance improvements:
			quant_bands:
			  with:    681 decicycles in quant_bands, 8388453 runs, 155 skips
			  without: 1190 decicycles in quant_bands, 8388386 runs, 222 skips
			  Around 42% for the function.
			Twoloop coder:
			  abs_pow34: with/without: 7.82s/8.17s. Around 4% for the entire encoder.
			  Both: with/without: 7.15s/8.17s. Around 12% for the entire encoder.
			Fast coder:
			  abs_pow34: with/without: 3.40s/3.77s. Around 10% for the entire encoder.
			  Both: with/without: 3.02s/3.77s. Around 20% faster for the entire encoder.
			Signed-off-by: Rostislav Pehlivanov <atomnuker@gmail.com>
			Tested-by: Michael Niedermayer <michael@niedermayer.cc>
			Reviewed-by: James Almer <jamrial@gmail.com>
		
			
				
	
	
		
			44 lines
		
	
	
		
			1.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			44 lines
		
	
	
		
			1.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * AAC encoder assembly optimizations
 | |
|  * Copyright (C) 2016 Rostislav Pehlivanov <atomnuker@gmail.com>
 | |
|  *
 | |
|  * This file is part of FFmpeg.
 | |
|  *
 | |
|  * FFmpeg is free software; you can redistribute it and/or
 | |
|  * modify it under the terms of the GNU Lesser General Public
 | |
|  * License as published by the Free Software Foundation; either
 | |
|  * version 2.1 of the License, or (at your option) any later version.
 | |
|  *
 | |
|  * FFmpeg is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|  * Lesser General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU Lesser General Public
 | |
|  * License along with FFmpeg; if not, write to the Free Software
 | |
|  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 | |
|  */
 | |
| 
 | |
| #include "config.h"
 | |
| 
 | |
| #include "libavutil/float_dsp.h"
 | |
| #include "libavutil/x86/cpu.h"
 | |
| #include "libavcodec/aacenc.h"
 | |
| 
 | |
/*
 * Prototypes for the SIMD routines that ff_aac_dsp_init_x86() installs into
 * the encoder context. Their definitions are not in this file; going by the
 * file header they are presumably provided by external x86 assembly
 * (TODO confirm against the build files).
 */

/* Routine installed as AACEncContext.abs_pow34 when the SSE check passes. */
void ff_abs_pow34_sse(float *out, const float *in, const int size);

/* Routine installed as AACEncContext.quant_bands when the SSE2 check passes. */
void ff_aac_quantize_bands_sse2(int *out, const float *in, const float *scaled,
                                int size, int is_signed, int maxval,
                                const float Q34, const float rounding);
 | |
| 
 | |
| av_cold void ff_aac_dsp_init_x86(AACEncContext *s)
 | |
| {
 | |
|     int cpu_flags = av_get_cpu_flags();
 | |
| 
 | |
|     if (EXTERNAL_SSE(cpu_flags))
 | |
|         s->abs_pow34   = ff_abs_pow34_sse;
 | |
| 
 | |
|     if (EXTERNAL_SSE2(cpu_flags))
 | |
|         s->quant_bands = ff_aac_quantize_bands_sse2;
 | |
| }
 |