Skip to content

Commit f8e1dd0

Browse files
committed
fix ruff
1 parent 5f1ed83 commit f8e1dd0

File tree

2 files changed

+3
-4
lines changed

2 files changed

+3
-4
lines changed

examples/vllm_serve/vllm_serve_fakequant.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -57,9 +57,6 @@
 import uvloop
 from tqdm import tqdm
 from transformers import AutoTokenizer
-
-import modelopt.torch.quantization as mtq
-from modelopt.torch.utils.dataset_utils import get_dataset_dataloader
 from vllm.distributed.parallel_state import get_pp_group, get_tp_group
 from vllm.entrypoints.openai.api_server import run_server
 from vllm.entrypoints.openai.cli_args import make_arg_parser
@@ -71,6 +68,9 @@
 # from vllm.v1.worker.gpu_model_runner import GPUModelRunner
 from vllm.v1.worker.gpu_worker import Worker
 
+import modelopt.torch.quantization as mtq
+from modelopt.torch.utils.dataset_utils import get_dataset_dataloader
+
 
 @contextmanager
 def disable_compilation(model):

modelopt/torch/quantization/plugins/vllm.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,6 @@
 import importlib
 
 import torch
-
 import vllm.model_executor.layers.fused_moe.layer as vllm_fused_moe_layer
 import vllm.model_executor.layers.linear as vllm_linear
 
0 commit comments

Comments
 (0)