Fix sampler: pass the embedding matrix to Sampler.forward() instead of storing it in __init__

2023-02-23 20:30:12 +00:00
parent fdd0f2f472
commit de0fabbc5c
2 changed files with 6 additions and 8 deletions
--- a/cacheflow/models/sample.py
+++ b/cacheflow/models/sample.py
@@ -8,15 +8,12 @@ from cacheflow.models import InputMetadata

 class Sampler(nn.Module):

-    def __init__(
-        self,
-        embedding: torch.Tensor,
-    ) -> None:
+    def __init__(self) -> None:
        super().__init__()
-        self.embedding = embedding  # [vocab_size, hidden_size]

    def forward(
        self,
+        embedding: torch.Tensor,
        hidden_states: torch.Tensor,
        input_metadata: InputMetadata,
    ) -> Dict[int, Tuple[int, int]]:
@@ -31,7 +28,7 @@ class Sampler(nn.Module):
        hidden_states = hidden_states[last_token_indicies]

        # Get the logits for the next tokens.
-        logits = torch.matmul(hidden_states, self.embedding.t())
+        logits = torch.matmul(hidden_states, embedding.t())

        # Sample the next tokens.
        # TODO(woosuk): Implement other sampling methods.