Skip to content
Open
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions examples/quantization_attention/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
TODO, eval from eldar
Original file line number Diff line number Diff line change
@@ -1,10 +1,10 @@
from compressed_tensors.offload import dispatch_model
from compressed_tensors.quantization import QuantizationArgs, QuantizationScheme
from datasets import load_dataset
from transformers import AutoModelForCausalLM, AutoTokenizer

from llmcompressor import oneshot
from llmcompressor.modifiers.quantization import QuantizationModifier
from compressed_tensors.offload import dispatch_model

# Select model and load it.
model_id = "meta-llama/Meta-Llama-3-8B-Instruct"
Expand Down
Loading