You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
argument("--min_load", help="[NOTE: this field isn't currently used at the workergroup level] minimum floor load in perf units/s (token/s for LLms)", type=float),
2110
2110
argument("--target_util", help="[NOTE: this field isn't currently used at the workergroup level] target capacity utilization (fraction, max 1.0, default 0.9)", type=float),
2111
2111
argument("--cold_mult", help="[NOTE: this field isn't currently used at the workergroup level]cold/stopped instance capacity target as multiple of hot capacity target (default 2.0)", type=float),
2112
+
argument("--cold_workers", help="min number of workers to keep 'cold' for this workergroup", type=int),
argument("--min_load", help="minimum floor load in perf units/s (token/s for LLms)", type=float),
5433
5434
argument("--target_util", help="target capacity utilization (fraction, max 1.0, default 0.9)", type=float),
5434
5435
argument("--cold_mult", help="cold/stopped instance capacity target as multiple of hot capacity target (default 2.5)", type=float),
5436
+
argument("--cold_workers", help="min number of workers to keep 'cold' for this workergroup", type=int),
5435
5437
argument("--test_workers",help="number of workers to create to get an performance estimate for while initializing workergroup (default 3)", type=int),
5436
5438
argument("--gpu_ram", help="estimated GPU RAM req (independent of search string)", type=float),
5437
5439
argument("--template_hash", help="template hash (**Note**: if you use this field, you can skip search_params, as they are automatically inferred from the template)", type=str),
0 commit comments