|
20 | 20 | SSM_MODELS = [
|
21 | 21 | "state-spaces/mamba-130m-hf",
|
22 | 22 | "tiiuae/falcon-mamba-tiny-dev",
|
23 |
| - "mistralai/Mamba-Codestral-7B-v0.1", |
| 23 | + "yujiepan/mamba2-codestral-v0.1-tiny-random", |
24 | 24 | ]
|
25 | 25 |
|
26 | 26 | HYBRID_MODELS = [
|
|
29 | 29 | # "pfnet/plamo-2-1b",
|
30 | 30 | "Zyphra/Zamba2-1.2B-instruct",
|
31 | 31 | "hmellor/tiny-random-BambaForCausalLM",
|
32 |
| - "ibm-ai-platform/Bamba-9B-v1", |
33 |
| - "nvidia/Nemotron-H-8B-Base-8K", |
34 | 32 | "ibm-granite/granite-4.0-tiny-preview",
|
35 | 33 | "tiiuae/Falcon-H1-0.5B-Base",
|
36 | 34 | ]
|
|
40 | 38 | # The HF transformers Mamba2 implementation is buggy for Codestral as it doesn't handle n_groups, so the test
|
41 | 39 | # doesn't compare vLLM output with HF output.
|
42 | 40 | # See https://github.com/huggingface/transformers/pull/35943
|
43 |
| - "mistralai/Mamba-Codestral-7B-v0.1", |
44 |
| - # Note: I'm not seeing the same output from vLLM V0 vs. HF transformers |
45 |
| - # for Nemotron-H-8B; currently only compare vLLM V0 vs. vLLM V1 |
46 |
| - "nvidia/Nemotron-H-8B-Base-8K", |
47 |
| - # NOTE: Currently the test fails due to HF transformers issue fixed in: |
48 |
| - # https://github.com/huggingface/transformers/pull/39033 |
49 |
| - # We will enable vLLM test for Granite after next HF transformers release. |
50 |
| - "ibm-granite/granite-4.0-tiny-preview", |
| 41 | + "yujiepan/mamba2-codestral-v0.1-tiny-random", |
| 42 | + # transformers 4.55 still produces garbage output for this model
| 43 | + # TODO(tdoublep): follow-up on transformers side |
| 44 | + "ibm-granite/granite-4.0-tiny-preview" |
51 | 45 | ]
|
52 | 46 |
|
53 | 47 | V1_SUPPORTED_MODELS = [
|
54 | 48 | "state-spaces/mamba-130m-hf",
|
55 | 49 | "ai21labs/Jamba-tiny-dev",
|
56 |
| - "mistralai/Mamba-Codestral-7B-v0.1", |
57 |
| - "ibm-ai-platform/Bamba-9B-v1", |
| 50 | + "yujiepan/mamba2-codestral-v0.1-tiny-random", |
58 | 51 | "Zyphra/Zamba2-1.2B-instruct",
|
59 |
| - "nvidia/Nemotron-H-8B-Base-8K", |
| 52 | + "hmellor/tiny-random-BambaForCausalLM", |
60 | 53 | "ibm-granite/granite-4.0-tiny-preview",
|
61 | 54 | "tiiuae/Falcon-H1-0.5B-Base",
|
62 | 55 | ]
|
|
0 commit comments