diff --git a/vllm/model_executor/models/aquila.py b/vllm/model_executor/models/aquila.py index 8372da562..889239cdb 100644 --- a/vllm/model_executor/models/aquila.py +++ b/vllm/model_executor/models/aquila.py @@ -20,11 +20,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only LLaMA model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only LLaMA model compatible with HuggingFace weights.""" from typing import Any, Dict, List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/baichuan.py b/vllm/model_executor/models/baichuan.py index 93cbc1a85..61cc2192b 100644 --- a/vllm/model_executor/models/baichuan.py +++ b/vllm/model_executor/models/baichuan.py @@ -17,11 +17,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only BaiChuan model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only BaiChuan model compatible with HuggingFace weights.""" import math from typing import List, Optional, Tuple diff --git a/vllm/model_executor/models/bloom.py b/vllm/model_executor/models/bloom.py index 0eb3fdbb9..99ccd7442 100644 --- a/vllm/model_executor/models/bloom.py +++ b/vllm/model_executor/models/bloom.py @@ -15,11 +15,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only BLOOM model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only BLOOM model compatible with HuggingFace weights.""" import math from typing import List, Optional, Tuple diff --git a/vllm/model_executor/models/chatglm.py b/vllm/model_executor/models/chatglm.py index 2a113a155..db426a942 100644 --- a/vllm/model_executor/models/chatglm.py +++ b/vllm/model_executor/models/chatglm.py @@ -1,11 +1,7 @@ # coding=utf-8 # Adapted from # https://github.com/THUDM/ChatGLM2-6B -"""Inference-only ChatGLM model compatible with THUDM weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only ChatGLM model compatible with THUDM weights.""" from typing import List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/gpt2.py b/vllm/model_executor/models/gpt2.py index 0f9f74d32..5dce59f77 100644 --- a/vllm/model_executor/models/gpt2.py +++ b/vllm/model_executor/models/gpt2.py @@ -16,11 +16,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only GPT-2 model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only GPT-2 model compatible with HuggingFace weights.""" from typing import List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/gpt_bigcode.py b/vllm/model_executor/models/gpt_bigcode.py index 47a5d7711..9b69fc90b 100644 --- a/vllm/model_executor/models/gpt_bigcode.py +++ b/vllm/model_executor/models/gpt_bigcode.py @@ -17,11 +17,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only GPTBigCode model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only GPTBigCode model compatible with HuggingFace weights.""" from typing import List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/gpt_j.py b/vllm/model_executor/models/gpt_j.py index 9093d642a..1f0f7d420 100644 --- a/vllm/model_executor/models/gpt_j.py +++ b/vllm/model_executor/models/gpt_j.py @@ -15,11 +15,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only GPT-J model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only GPT-J model compatible with HuggingFace weights.""" from typing import List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/gpt_neox.py b/vllm/model_executor/models/gpt_neox.py index 8c0667d88..b289ddc51 100644 --- a/vllm/model_executor/models/gpt_neox.py +++ b/vllm/model_executor/models/gpt_neox.py @@ -15,11 +15,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only GPT-NeoX model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only GPT-NeoX model compatible with HuggingFace weights.""" from typing import List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/llama.py b/vllm/model_executor/models/llama.py index c3192e806..8e7344da4 100644 --- a/vllm/model_executor/models/llama.py +++ b/vllm/model_executor/models/llama.py @@ -20,11 +20,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only LLaMA model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only LLaMA model compatible with HuggingFace weights.""" from typing import Any, Dict, List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/mistral.py b/vllm/model_executor/models/mistral.py index 793e25b63..d18572610 100644 --- a/vllm/model_executor/models/mistral.py +++ b/vllm/model_executor/models/mistral.py @@ -20,11 +20,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only Mistral model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only Mistral model compatible with HuggingFace weights.""" from typing import List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/opt.py b/vllm/model_executor/models/opt.py index 4c8ff596b..8d88ccd70 100644 --- a/vllm/model_executor/models/opt.py +++ b/vllm/model_executor/models/opt.py @@ -16,11 +16,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only OPT model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only OPT model compatible with HuggingFace weights.""" from typing import List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/phi_1_5.py b/vllm/model_executor/models/phi_1_5.py index 18cd40f39..7ef614601 100644 --- a/vllm/model_executor/models/phi_1_5.py +++ b/vllm/model_executor/models/phi_1_5.py @@ -34,11 +34,7 @@ # CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, # OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. -"""Inference-only Phi-1.5 model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only Phi-1.5 model compatible with HuggingFace weights.""" from typing import List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/qwen.py b/vllm/model_executor/models/qwen.py index ce13cae7e..d581838f6 100644 --- a/vllm/model_executor/models/qwen.py +++ b/vllm/model_executor/models/qwen.py @@ -3,11 +3,7 @@ # https://huggingface.co/Qwen/Qwen-7B/blob/main/modeling_qwen.py # Copyright (c) Alibaba Cloud. # LICENSE: https://huggingface.co/Qwen/Qwen-7B/blob/main/LICENSE -"""Inference-only QWen model compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only QWen model compatible with HuggingFace weights.""" from typing import Any, Dict, List, Optional, Tuple import torch diff --git a/vllm/model_executor/models/yi.py b/vllm/model_executor/models/yi.py index 8faa106f2..c45713285 100644 --- a/vllm/model_executor/models/yi.py +++ b/vllm/model_executor/models/yi.py @@ -20,11 +20,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -"""Inference-only Yi model (https://01.ai) compatible with HuggingFace weights. - -The input of the model is flattened to a 1D tensor of tokens. The model uses -InputMetadata to extract the original 2D shape of the input. -""" +"""Inference-only Yi model (https://01.ai) compatible with HuggingFace weights.""" from typing import Any, Dict, List, Optional, Tuple import torch