mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 16:48:03 +08:00
[Feature][MTP] Support cacheKV transfer in per_chunk mode (#2890)
* support chunk_prefill in both normal and speculative_decoding (MTP) modes
* optimize pd-disaggregation config
* fix bug
This commit is contained in:
@@ -35,5 +35,5 @@ struct msgdata {
|
||||
|
||||
struct msgdatakv {
|
||||
long mtype;
|
||||
int mtext[MAX_BSZ * 2 + 2]; // encoder_count, layer_id, bid- pair
|
||||
int mtext[MAX_BSZ * 3 + 2]; // encoder_count, layer_id, bid- pair
|
||||
};
|
Reference in New Issue
Block a user