Skip to content

Commit 0711630

Browse files
fynnsu and dsikka authored
Replace nm-testing/llama2.c-stories15M with nm-testing/tinysmokellama-3.2 (#1833)
SUMMARY: Created a new [model](https://huggingface.co/nm-testing/tinysmokellama-3.2) based on a `Llama-3.2` model for smoke testing. Note: the model is not properly trained, so its outputs shouldn't be used, but its weights come from the distribution of a real model, "meta-llama/Llama-3.2-1B".

TEST PLAN: Ran the "transformers" checks locally; they will also be rerun by CI.

---------

Signed-off-by: Fynn Schmitt-Ulms <[email protected]>
Co-authored-by: Dipika Sikka <[email protected]>
1 parent 27303c4 commit 0711630

30 files changed

+38
-38
lines changed
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
cadence: "commit"
22
test_type: "regression"
3-
model_stub: "nm-testing/llama2.c-stories15M"
3+
model_stub: "nm-testing/tinysmokellama-3.2"
44
new_recipe: "tests/llmcompressor/transformers/compression/recipes/new_quant_channel.yaml"
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
cadence: "commit"
22
test_type: "regression"
3-
model_stub: "nm-testing/llama2.c-stories15M"
3+
model_stub: "nm-testing/tinysmokellama-3.2"
44
new_recipe: "tests/llmcompressor/transformers/compression/recipes/new_quant_fp8.yaml"
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
cadence: "commit"
22
test_type: "regression"
3-
model_stub: "nm-testing/llama2.c-stories15M"
3+
model_stub: "nm-testing/tinysmokellama-3.2"
44
new_recipe: "tests/llmcompressor/transformers/compression/recipes/new_quant_full.yaml"
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
cadence: "commit"
22
test_type: "regression"
3-
model_stub: "nm-testing/llama2.c-stories15M"
3+
model_stub: "nm-testing/tinysmokellama-3.2"
44
new_recipe: "tests/llmcompressor/transformers/compression/recipes/new_quant_weight.yaml"

tests/llmcompressor/transformers/compression/test_compress_tensor_utils.py

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@
4646
def test_sparse_model_reload(compressed, config, dtype, tmp_path):
4747
recipe_str = "tests/llmcompressor/transformers/obcq/recipes/test_tiny2.yaml"
4848
expected_sparsity = 0.5
49-
model_path = "nm-testing/llama2.c-stories15M"
49+
model_path = "nm-testing/tinysmokellama-3.2"
5050
dataset = "open_platypus"
5151
concatenate_data = False
5252
num_calibration_samples = 64
@@ -124,7 +124,7 @@ def test_sparse_model_reload(compressed, config, dtype, tmp_path):
124124
def test_dense_model_save(tmp_path, skip_compression_stats, save_compressed):
125125
reset_session()
126126

127-
model_path = "nm-testing/llama2.c-stories15M"
127+
model_path = "nm-testing/tinysmokellama-3.2"
128128
model = AutoModelForCausalLM.from_pretrained(model_path)
129129

130130
inferred_global_sparsity = SparsityConfigMetadata.infer_global_sparsity(model)
@@ -161,7 +161,7 @@ def test_quant_model_reload(format, dtype, tmp_path):
161161
recipe_str = (
162162
"tests/llmcompressor/transformers/compression/recipes/new_quant_simple.yaml"
163163
)
164-
model_path = "nm-testing/llama2.c-stories15M"
164+
model_path = "nm-testing/tinysmokellama-3.2"
165165
device = "cuda:0" if not torch.cuda.is_available() else "cpu"
166166
dataset = "open_platypus"
167167
concatenate_data = False
@@ -244,7 +244,7 @@ def test_quant_model_reload(format, dtype, tmp_path):
244244
],
245245
)
246246
def test_model_reload(offload, torch_dtype, tie_word_embeddings, device, tmp_path):
247-
model_path = "nm-testing/llama2.c-stories15M"
247+
model_path = "nm-testing/tinysmokellama-3.2"
248248
save_path = tmp_path / "save_path"
249249

250250
model = AutoModelForCausalLM.from_pretrained(model_path, torch_dtype=torch_dtype)
@@ -296,7 +296,7 @@ def test_model_reload_gpu(offload, torch_dtype, tie_word_embeddings, device, tmp
296296
)
297297
def test_model_shared_tensors(offload, torch_dtype, tie_word_embeddings, device):
298298
# load model
299-
model_path = "nm-testing/llama2.c-stories15M"
299+
model_path = "nm-testing/tinysmokellama-3.2"
300300
model = AutoModelForCausalLM.from_pretrained(model_path, torch_dtype=torch_dtype)
301301
if offload:
302302
model = dispatch_model(model, {"": device}, force_hooks=True)
@@ -337,7 +337,7 @@ def test_model_shared_tensors_gpu(offload, torch_dtype, tie_word_embeddings, dev
337337
"model_stub, recipe, sparse_format, quant_format",
338338
[
339339
(
340-
"nm-testing/llama2.c-stories15M",
340+
"nm-testing/tinysmokellama-3.2",
341341
"tests/llmcompressor/transformers/compression/recipes/sparse_24_fp8.yaml",
342342
CompressionFormat.sparse_24_bitmask.value,
343343
CompressionFormat.float_quantized.value,
@@ -418,7 +418,7 @@ def test_compressor_stacking(model_stub, recipe, sparse_format, quant_format, tm
418418
"model_stub, recipe, sparse_format",
419419
[
420420
(
421-
"nm-testing/llama2.c-stories15M",
421+
"nm-testing/tinysmokellama-3.2",
422422
"tests/llmcompressor/transformers/compression/recipes/sparse_24.yaml",
423423
CompressionFormat.sparse_24_bitmask.value,
424424
),

tests/llmcompressor/transformers/compression/test_recipe_parsing.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@ def setup_model_and_config(tmp_path):
1717
Loads a test model and returns common arguments used in oneshot runs.
1818
"""
1919
model = AutoModelForCausalLM.from_pretrained(
20-
"nm-testing/llama2.c-stories15M",
20+
"nm-testing/tinysmokellama-3.2",
2121
torch_dtype="auto",
2222
)
2323

tests/llmcompressor/transformers/finetune/data/conftest.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@
66

77
@pytest.fixture
88
def tiny_llama_path():
9-
return "nm-testing/llama2.c-stories15M"
9+
return "nm-testing/tinysmokellama-3.2"
1010

1111

1212
@pytest.fixture
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
cadence: "commit"
22
test_type: "sanity"
3-
model: "nm-testing/llama2.c-stories15M"
3+
model: "nm-testing/tinysmokellama-3.2"
44
file_extension: json
55
num_train_epochs: 1
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
cadence: "commit"
22
test_type: "sanity"
3-
model: "nm-testing/llama2.c-stories15M"
3+
model: "nm-testing/tinysmokellama-3.2"
44
file_extension: csv
55
num_train_epochs: 1
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
cadence: "nightly"
22
test_type: "regression"
3-
model: "nm-testing/llama2.c-stories15M"
3+
model: "nm-testing/tinysmokellama-3.2"
44
dataset: open_platypus

0 commit comments

Comments
 (0)