Skip to content

Commit 4934d49

Browse files
authored
Support GPT-NeoX Models without attention biases (#2301)
1 parent 358c328 commit 4934d49

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

vllm/model_executor/models/gpt_neox.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -54,6 +54,7 @@ def __init__(
5454
self.total_num_heads = config.num_attention_heads
5555
self.hidden_size = config.hidden_size
5656
self.head_size = self.hidden_size // self.total_num_heads
57+
self.bias = getattr(config, "attention_bias", True)
5758

5859
tensor_model_parallel_world_size = (
5960
get_tensor_model_parallel_world_size())
@@ -65,11 +66,13 @@ def __init__(
6566
config.hidden_size,
6667
self.head_size,
6768
self.total_num_heads,
69+
bias=self.bias,
6870
linear_method=linear_method,
6971
)
7072
self.dense = RowParallelLinear(
7173
config.hidden_size,
7274
config.hidden_size,
75+
bias=self.bias,
7376
linear_method=linear_method,
7477
)
7578
scaling = self.head_size**-0.5

0 commit comments

Comments (0)