mirror of
https://github.com/RYDE-WORK/Langchain-Chatchat.git
synced 2026-02-06 14:57:44 +08:00
更新多卡部署
This commit is contained in:
parent
84e4981cc1
commit
6590ca32db
@ -44,7 +44,7 @@ def create_model_worker_app(
|
|||||||
gptq_act_order=None,
|
gptq_act_order=None,
|
||||||
gpus=None,
|
gpus=None,
|
||||||
num_gpus=1,
|
num_gpus=1,
|
||||||
max_gpu_memory=None,
|
max_gpu_memory="20GiB",
|
||||||
cpu_offloading=None,
|
cpu_offloading=None,
|
||||||
worker_address=base_url.format(model_worker_port),
|
worker_address=base_url.format(model_worker_port),
|
||||||
controller_address=base_url.format(controller_port),
|
controller_address=base_url.format(controller_port),
|
||||||
|
|||||||
@ -76,6 +76,7 @@ parser.add_argument("--num-gpus", type=int, default=1)
|
|||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--max-gpu-memory",
|
"--max-gpu-memory",
|
||||||
type=str,
|
type=str,
|
||||||
|
default="20GiB",
|
||||||
help="The maximum memory per gpu. Use a string like '13Gib'",
|
help="The maximum memory per gpu. Use a string like '13Gib'",
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user