Skip to content

Commit 638b8dd

Browse files
Fixed linting issues with QAT Notebook
Signed-off-by: Farshad Ghodsian <[email protected]>
1 parent 7a5884c commit 638b8dd

File tree

1 file changed

+12
-3
lines changed

1 file changed

+12
-3
lines changed

examples/llm_qat/notebooks/QAT_QAD_Walkthrough.ipynb

Lines changed: 12 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -145,12 +145,11 @@
145145
},
146146
{
147147
"cell_type": "code",
148-
"execution_count": 3,
148+
"execution_count": null,
149149
"id": "b6af94af-1de6-4cb1-959b-98fb3f4e1932",
150150
"metadata": {},
151151
"outputs": [],
152152
"source": [
153-
"from transformers import AutoConfig\n",
154153
"from trl import ModelConfig\n",
155154
"\n",
156155
"model_args = ModelConfig(\n",
@@ -608,6 +607,8 @@
608607
"metadata": {},
609608
"outputs": [],
610609
"source": [
610+
"%%sh # [run in command line outside notebook]\n",
611+
"\n",
611612
"docker run --rm --ipc=host -it \\\n",
612613
" --ulimit stack=67108864 --ulimit memlock=-1 \\\n",
613614
" --gpus all -p 8000:8000 -e TRTLLM_ENABLE_PDL=1 \\\n",
@@ -640,6 +641,8 @@
640641
"metadata": {},
641642
"outputs": [],
642643
"source": [
644+
"%%sh # [run in TensorRT-LLM container]\n",
645+
"\n",
643646
"git clone https://github.com/NVIDIA/TensorRT-Model-Optimizer.git"
644647
]
645648
},
@@ -658,6 +661,8 @@
658661
"metadata": {},
659662
"outputs": [],
660663
"source": [
664+
"%%sh # [run in TensorRT-LLM container]\n",
665+
"\n",
661666
"cd TensorRT-Model-Optimizer/\n",
662667
"pip install -e ."
663668
]
@@ -679,6 +684,8 @@
679684
},
680685
"outputs": [],
681686
"source": [
687+
"%%sh # [run in TensorRT-LLM container]\n",
688+
"\n",
682689
"# set export path for converted checkpoints. The script saves the converted checkpoint in ${ROOT_SAVE_PATH}/saved_models_${MODEL_FULL_NAME}\n",
683690
"export ROOT_SAVE_PATH=/app/tensorrt_llm\n",
684691
"\n",
@@ -710,6 +717,8 @@
710717
"metadata": {},
711718
"outputs": [],
712719
"source": [
720+
"%%sh # [run in TensorRT-LLM container]\n",
721+
"\n",
713722
"trtllm-serve /app/tensorrt_llm/saved_models_checkpoint-450_nvfp4_hf/ \\\n",
714723
" --max_batch_size 1 --max_num_tokens 1024 \\\n",
715724
" --max_seq_len 4096 --tp_size 8 --pp_size 1 \\\n",
@@ -803,7 +812,7 @@
803812
},
804813
{
805814
"cell_type": "code",
806-
"execution_count": 13,
815+
"execution_count": null,
807816
"id": "fb78741b-30cb-46f2-a292-c5192cbca9ed",
808817
"metadata": {},
809818
"outputs": [

0 commit comments

Comments (0)