File tree Expand file tree Collapse file tree 2 files changed +61
-0
lines changed
tests/external/iree-test-suites/sharktank_models/quality_tests/llama Expand file tree Collapse file tree 2 files changed +61
-0
lines changed Original file line number Diff line number Diff line change 1+ {
2+ "inputs" : [
3+ {
4+ "source" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_next_tokens.npy"
5+ },
6+ {
7+ "source" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_seq_lens.npy"
8+ },
9+ {
10+ "source" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_start_positions.npy"
11+ },
12+ {
13+ "source" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_seq_block_ids.npy"
14+ },
15+ {
16+ "source" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/decode_cache_state.npy"
17+ }
18+ ],
19+ "device" : " hip" ,
20+ "real_weights" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/real_weights.irpa" ,
21+ "mlir" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/8b_f16_random.mlir" ,
22+ "compiler_flags" : [
23+ " --iree-hal-target-device=hip" ,
24+ " --iree-opt-level=O3" ,
25+ " --iree-stream-resource-memory-model=discrete" ,
26+ " --iree-opt-data-tiling=false" ,
27+ " --iree-dispatch-creation-data-tiling" ,
28+ " --iree-hip-encoding-layout-resolver=data-tiling" ,
29+ " --iree-llvmgpu-test-combine-layout-transformation"
30+ ],
31+ "run_function" : " decode_bs4"
32+ }
Original file line number Diff line number Diff line change 1+ {
2+ "inputs" : [
3+ {
4+ "source" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/prefill_token_ids.npy"
5+ },
6+ {
7+ "source" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/prefill_seq_lens.npy"
8+ },
9+ {
10+ "source" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/prefill_seq_block_ids.npy"
11+ },
12+ {
13+ "source" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/toy_llama_inputs/prefill_cache_state.npy"
14+ }
15+ ],
16+ "device" : " hip" ,
17+ "real_weights" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/real_weights.irpa" ,
18+ "mlir" : " https://sharkpublic.blob.core.windows.net/sharkpublic/halo-models/llm-dev/llama3_8b_random/8b_f16_random.mlir" ,
19+ "compiler_flags" : [
20+ " --iree-hal-target-device=hip" ,
21+ " --iree-opt-level=O3" ,
22+ " --iree-stream-resource-memory-model=discrete" ,
23+ " --iree-opt-data-tiling=false" ,
24+ " --iree-dispatch-creation-data-tiling" ,
25+ " --iree-hip-encoding-layout-resolver=data-tiling" ,
26+ " --iree-llvmgpu-test-combine-layout-transformation"
27+ ],
28+ "run_function" : " prefill_bs4"
29+ }
You can’t perform that action at this time.
0 commit comments