mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
[Iluvatar] Support V1_KVCACHE_SCHEDULER and paddleocr-vl rope mode (#5555)
This commit is contained in:
@@ -28,8 +28,13 @@ __global__ void PrefixSumKernel(int64_t *ids_remove_padding,
|
||||
const int max_seq_len) {
|
||||
const int bi = blockIdx.x;
|
||||
const int tid = threadIdx.x;
|
||||
#ifdef PADDLE_WITH_COREX
|
||||
const int warp_id = threadIdx.x / 64;
|
||||
const int lane_id = threadIdx.x % 64;
|
||||
#else
|
||||
const int warp_id = threadIdx.x / 32;
|
||||
const int lane_id = threadIdx.x % 32;
|
||||
#endif
|
||||
|
||||
int cum_seq_len = 0;
|
||||
|
||||
|
||||
Reference in New Issue
Block a user