mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-10-05 16:48:03 +08:00
update env docs for Machete (#3959)
This commit is contained in:
@@ -72,5 +72,7 @@ environment_variables: dict[str, Callable[[], Any]] = {
|
|||||||
"FD_USE_DEEP_GEMM":
|
"FD_USE_DEEP_GEMM":
|
||||||
lambda: bool(int(os.getenv("FD_USE_DEEP_GEMM", "0"))),
|
lambda: bool(int(os.getenv("FD_USE_DEEP_GEMM", "0"))),
|
||||||
|
|
||||||
|
# Whether to use Machete for wint4 dense GEMM.
|
||||||
|
"FD_USE_MACHETE": lambda: os.getenv("FD_USE_MACHETE", "0"),
|
||||||
}
|
}
|
||||||
```
|
```
|
||||||
|
@@ -71,5 +71,8 @@ environment_variables: dict[str, Callable[[], Any]] = {
|
|||||||
# 是否使用DeepGemm后端的FP8 blockwise MoE.
|
# 是否使用DeepGemm后端的FP8 blockwise MoE.
|
||||||
"FD_USE_DEEP_GEMM":
|
"FD_USE_DEEP_GEMM":
|
||||||
lambda: bool(int(os.getenv("FD_USE_DEEP_GEMM", "0"))),
|
lambda: bool(int(os.getenv("FD_USE_DEEP_GEMM", "0"))),
|
||||||
|
|
||||||
|
# 是否使用 Machete 后端的 wint4 GEMM.
|
||||||
|
"FD_USE_MACHETE": lambda: os.getenv("FD_USE_MACHETE", "0"),
|
||||||
}
|
}
|
||||||
```
|
```
|
||||||
|
Reference in New Issue
Block a user