File tree Expand file tree Collapse file tree 2 files changed +3
-4
lines changed
modelopt/torch/quantization/plugins Expand file tree Collapse file tree 2 files changed +3
-4
lines changed Original file line number Diff line number Diff line change 57
57
import uvloop
58
58
from tqdm import tqdm
59
59
from transformers import AutoTokenizer
60
-
61
- import modelopt .torch .quantization as mtq
62
- from modelopt .torch .utils .dataset_utils import get_dataset_dataloader
63
60
from vllm .distributed .parallel_state import get_pp_group , get_tp_group
64
61
from vllm .entrypoints .openai .api_server import run_server
65
62
from vllm .entrypoints .openai .cli_args import make_arg_parser
71
68
# from vllm.v1.worker.gpu_model_runner import GPUModelRunner
72
69
from vllm .v1 .worker .gpu_worker import Worker
73
70
71
+ import modelopt .torch .quantization as mtq
72
+ from modelopt .torch .utils .dataset_utils import get_dataset_dataloader
73
+
74
74
75
75
@contextmanager
76
76
def disable_compilation (model ):
Original file line number Diff line number Diff line change 18
18
import importlib
19
19
20
20
import torch
21
-
22
21
import vllm .model_executor .layers .fused_moe .layer as vllm_fused_moe_layer
23
22
import vllm .model_executor .layers .linear as vllm_linear
24
23
You can’t perform that action at this time.
0 commit comments