mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 16:48:03 +08:00
[v1loader]Reduce EB300B model loading time (#3700)
* speed up eb45 * update
This commit is contained in:
@@ -29,7 +29,6 @@ from safetensors import safe_open
|
||||
from tqdm import tqdm
|
||||
|
||||
from fastdeploy.config import FDConfig
|
||||
from fastdeploy.model_executor.layers.utils import get_tensor
|
||||
from fastdeploy.model_executor.models.tp_utils import (
|
||||
check_tensor_parallel_prerequisites,
|
||||
)
|
||||
@@ -186,8 +185,7 @@ def fast_weights_iterator(safe_tensor_list: list[str]):
|
||||
with fast_safe_open(st_file, framework="np") as f:
|
||||
for name in f.keys():
|
||||
param_slice = f.get_slice(name)
|
||||
paddle_tensor = get_tensor(param_slice)
|
||||
yield name, paddle_tensor
|
||||
yield name, param_slice
|
||||
|
||||
|
||||
def fastsafetensors_weights_iterator(
|
||||
|
Reference in New Issue
Block a user