Make it easy to profile Ray workers with Nsight (#3162)

Co-authored-by: Roger Wang <136131678+ywang96@users.noreply.github.com>
This commit is contained in:
Philipp Moritz
2024-03-03 16:19:13 -08:00
committed by GitHub
parent 996d095c54
commit 17c3103c56
4 changed files with 34 additions and 2 deletions

View File

@@ -26,6 +26,7 @@ def main(args: argparse.Namespace):
enforce_eager=args.enforce_eager,
kv_cache_dtype=args.kv_cache_dtype,
device=args.device,
ray_workers_use_nsight=args.ray_workers_use_nsight,
)
sampling_params = SamplingParams(
@@ -145,5 +146,10 @@ if __name__ == '__main__':
default="cuda",
choices=["cuda"],
help='device type for vLLM execution, supporting CUDA only currently.')
parser.add_argument(
"--ray-workers-use-nsight",
action='store_true',
help="If specified, use nsight to profile ray workers",
)
args = parser.parse_args()
main(args)