From 1afba47059c21ea4b1ac14d543bba480a01b7ad6 Mon Sep 17 00:00:00 2001 From: Meng Zhang Date: Tue, 3 Oct 2023 15:52:25 -0700 Subject: [PATCH] feat: allow setting num_replicas_per_device for CUDA to increase throughput --- crates/tabby/src/serve/mod.rs | 4 ---- 1 file changed, 4 deletions(-) diff --git a/crates/tabby/src/serve/mod.rs b/crates/tabby/src/serve/mod.rs index 40be980..b1f209b 100644 --- a/crates/tabby/src/serve/mod.rs +++ b/crates/tabby/src/serve/mod.rs @@ -244,10 +244,6 @@ fn fallback() -> routing::MethodRouter { } fn valid_args(args: &ServeArgs) { - if args.device == Device::Cuda && args.num_replicas_per_device != 1 { - fatal!("CUDA device only supports 1 replicas per device"); - } - if args.device == Device::Cpu && (args.device_indices.len() != 1 || args.device_indices[0] != 0) { fatal!("CPU device only supports device indices = [0]");