Add NVIDIA TensorRT Model Optimizer in vLLM documentation (#17561)

2025-05-02 11:36:46 -07:00
parent 3e887d2e0c
commit 182f40ea8b
3 changed files with 90 additions and 1 deletions
--- a/docs/source/features/quantization/index.md
+++ b/docs/source/features/quantization/index.md
@@ -17,6 +17,7 @@ gptqmodel
 int4
 int8
 fp8
+modelopt
 quark
 quantized_kvcache
 torchao