tianlef 
							
						 
					 
					
						
						
							
						
						0bc7d076fc 
					 
					
						
						
							
							[CE]add x1 w4a8c8 benchamrk config ( #3607 )  
						
						... 
						
						
						
						* [CE]add x1 w4a8c8 benchamrk config
* [CE]add x1 w4a8c8 benchamrk config
* [CE]add x1 w4a8c8 benchamrk config 
						
						
					 
					
						2025-08-26 11:27:32 +08:00 
						 
				 
			
				
					
						
							
							
								Zhang Yulong 
							
						 
					 
					
						
						
							
						
						9ff2dfb162 
					 
					
						
						
							
							Create eb45-8k-fp8-tp1-dp8_ep.yaml ( #3485 )  
						
						... 
						
						
	
		
			
	 
	
	
		
	
	
		
			
				
	Deploy GitHub Pages / deploy (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / publish_pre_check (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / print_publish_pre_check_outputs (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / FD-Clone-Linux (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / Show Code Archive Output (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / BUILD_SM8090 (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / BUILD_SM8689 (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / PADDLE_PYPI_UPLOAD_8090 (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / PADDLE_PYPI_UPLOAD_8689 (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / Run FastDeploy Unit Tests and Coverage (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / Run FastDeploy LogProb Tests (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / Extracted partial CE model tasks to run in CI. (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / Run Base Tests (push) Has been cancelled 
				
			 
		
			
				
	Publish Job / Run Accuracy Tests (push) Has been cancelled 
				
			 
		
		
	 
 
	 
						
						混合架构EP并行yaml 
						
						
					 
					
						2025-08-20 14:33:54 +08:00 
						 
				 
			
				
					
						
							
							
								yinwei 
							
						 
					 
					
						
						
							
						
						776fb03250 
					 
					
						
						
							
							add error info ( #3040 )  
						
						
						
						
					 
					
						2025-07-28 15:10:28 +08:00 
						 
				 
			
				
					
						
							
							
								Zhang Yulong 
							
						 
					 
					
						
						
							
						
						5151bc92c8 
					 
					
						
						
							
							Update benchmark tools ( #3004 )  
						
						... 
						
						
	
		
			
	 
	
	
		
	
	
		
			
				
	Deploy GitHub Pages / deploy (push) Has been cancelled 
				
			 
		
		
	 
 
	 
						
						* update benchmark tools
* update benchmark tools 
						
						
					 
					
						2025-07-24 15:19:23 +08:00 
						 
				 
			
				
					
						
							
							
								xiegegege 
							
						 
					 
					
						
						
							
						
						e3a843f2c5 
					 
					
						
						
							
							[benchmark] add quantization for benchmark yaml ( #2995 )  
						
						
						
						
					 
					
						2025-07-24 13:26:34 +08:00 
						 
				 
			
				
					
						
							
							
								Zero Rains 
							
						 
					 
					
						
						
							
						
						25698d56d1 
					 
					
						
						
							
							polish code with new pre-commit rule ( #2923 )  
						
						
						
						
					 
					
						2025-07-19 23:19:27 +08:00 
						 
				 
			
				
					
						
							
							
								RAM 
							
						 
					 
					
						
						
							
						
						0fad10b35a 
					 
					
						
						
							
							[Executor] CUDA Graph support padding batch ( #2844 )  
						
						... 
						
						
						
						* cuda graph support padding batch
* Integrate the startup parameters for the graph optimization backend and provide support for user - defined capture sizes.
* Do not insert max_num_seqs when the user specifies a capture list
* Support set graph optimization config from YAML file
* update cuda graph ci
* fix ci bug
* fix ci bug 
						
						
					 
					
						2025-07-15 19:49:01 -07:00 
						 
				 
			
				
					
						
							
							
								ophilia-lee 
							
						 
					 
					
						
						
							
						
						33db137d0b 
					 
					
						
						
							
							新增vLLM默认请求参数yaml  
						
						
						
						
					 
					
						2025-07-15 19:31:27 +08:00 
						 
				 
			
				
					
						
							
							
								lijingning 
							
						 
					 
					
						
						
							
						
						9d6a42b334 
					 
					
						
						
							
							适配vLLM无arrival_time;适配vLLM model必传;RequestFuncInput/RequestFuncOutput/SampleRequest新增用例编号no  
						
						
						
						
					 
					
						2025-07-15 19:31:27 +08:00 
						 
				 
			
				
					
						
							
							
								GoldPancake 
							
						 
					 
					
						
						
							
						
						f7cad30a38 
					 
					
						
						
							
							[Feature] Add speculative decoding simulation benchmark. ( #2751 )  
						
						... 
						
						
						
						* Add speculative decoding simulation benchmark
* Fix the name of the parameter 
						
						
					 
					
						2025-07-09 12:08:43 +08:00 
						 
				 
			
				
					
						
							
							
								Divano 
							
						 
					 
					
						
						
							
						
						050d9658a5 
					 
					
						
						
							
							Update requirements.txt  
						
						
						
						
					 
					
						2025-07-04 09:53:03 +08:00 
						 
				 
			
				
					
						
							
							
								Divano 
							
						 
					 
					
						
						
							
						
						be5cabaf80 
					 
					
						
						
							
							add quick benchmark ( #2703 )  
						
						... 
						
						
						
						测试脚本不需要过CI 
						
						
					 
					
						2025-07-04 09:32:36 +08:00 
						 
				 
			
				
					
						
							
							
								Zhang Yulong 
							
						 
					 
					
						
						
							
						
						264ddfdf8a 
					 
					
						
						
							
							Update README.md  
						
						
						
						
					 
					
						2025-06-30 10:28:15 +08:00 
						 
				 
			
				
					
						
							
							
								Jiang-Jia-Jun 
							
						 
					 
					
						
						
							
						
						92c2cfa2e7 
					 
					
						
						
							
							Sync v2.0 version of code to github repo  
						
						
						
						
					 
					
						2025-06-29 23:29:37 +00:00