Skip to content

Commit

Permalink
Changes based on comments.
Browse files: browse the repository at this point in the history.
  • Loading branch information
shawntan committed Sep 5, 2024
1 parent 5a21218 commit 353fbdf
Show file tree
Hide file tree
Showing 2 changed files with 0 additions and 3 deletions.
1 change: 0 additions & 1 deletion tests/models/test_granitemoe.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -33,7 +33,6 @@ def test_models(
max_tokens: int,
num_logprobs: int,
) -> None:
# TODO(sang): Sliding window should be tested separately.
with hf_runner(model, dtype=dtype) as hf_model:
hf_outputs = hf_model.generate_greedy_logprobs_limit(
example_prompts, max_tokens, num_logprobs)
Expand Down
2 changes: 0 additions & 2 deletions vllm/model_executor/models/granitemoe.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -25,7 +25,6 @@

import torch
from torch import nn
# from transformers import GraniteMoeConfig
from vllm.transformers_utils.configs.granitemoe import GraniteMoeConfig

from vllm.attention import Attention, AttentionMetadata
Expand All @@ -43,7 +42,6 @@
from vllm.model_executor.layers.vocab_parallel_embedding import (
DEFAULT_VOCAB_PADDING_SIZE, ParallelLMHead, VocabParallelEmbedding)
from vllm.model_executor.sampling_metadata import SamplingMetadata
# from vllm.sequence import IntermediateTensors, SamplerOutput
from vllm.sequence import IntermediateTensors
from vllm.model_executor.layers.sampler import Sampler, SamplerOutput

Expand Down

0 comments on commit 353fbdf

Please sign in to comment.