Skip to content

Commit 83789af

Browse files
[iree-test-suites] Add data tiling tests for LLAMA 8B (#21832)
-- This commit adds e2e tests for LLAMA 8B via data tiling. Signed-off-by: Abhishek Varma <[email protected]>
1 parent a327b2d commit 83789af

File tree

2 files changed

+61
-0
lines changed

2 files changed

+61
-0
lines changed
Lines changed: 32 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,32 @@
1+
{
2+
"inputs": [
3+
{
4+
"source": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_next_tokens.npy"
5+
},
6+
{
7+
"source": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_seq_lens.npy"
8+
},
9+
{
10+
"source": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_start_positions.npy"
11+
},
12+
{
13+
"source": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_seq_block_ids.npy"
14+
},
15+
{
16+
"source": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_cache_state.npy"
17+
}
18+
],
19+
"device": "hip",
20+
"real_weights": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/real_weights.irpa",
21+
"mlir": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/8b_f16_random.mlir",
22+
"compiler_flags": [
23+
"--iree-hal-target-device=hip",
24+
"--iree-opt-level=O3",
25+
"--iree-stream-resource-memory-model=discrete",
26+
"--iree-opt-data-tiling=false",
27+
"--iree-dispatch-creation-data-tiling",
28+
"--iree-hip-encoding-layout-resolver=data-tiling",
29+
"--iree-llvmgpu-test-combine-layout-transformation"
30+
],
31+
"run_function": "decode_bs4"
32+
}
Lines changed: 29 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,29 @@
1+
{
2+
"inputs": [
3+
{
4+
"source": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/prefill_token_ids.npy"
5+
},
6+
{
7+
"source": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/prefill_seq_lens.npy"
8+
},
9+
{
10+
"source": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/prefill_seq_block_ids.npy"
11+
},
12+
{
13+
"source": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/prefill_cache_state.npy"
14+
}
15+
],
16+
"device": "hip",
17+
"real_weights": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/real_weights.irpa",
18+
"mlir": "https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/8b_f16_random.mlir",
19+
"compiler_flags": [
20+
"--iree-hal-target-device=hip",
21+
"--iree-opt-level=O3",
22+
"--iree-stream-resource-memory-model=discrete",
23+
"--iree-opt-data-tiling=false",
24+
"--iree-dispatch-creation-data-tiling",
25+
"--iree-hip-encoding-layout-resolver=data-tiling",
26+
"--iree-llvmgpu-test-combine-layout-transformation"
27+
],
28+
"run_function": "prefill_bs4"
29+
}

0 commit comments

Comments
 (0)