Skip to content

Commit 0176060

Browse files
madamczyk-intel, adobrzyn
authored and committed
Disable value splitting on G3 (#58)
1 parent 027f5d0 commit 0176060

File tree

1 file changed

+4
-1
lines changed

1 file changed

+4
-1
lines changed

vllm/hpu/ops.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,11 +9,14 @@
99
import torch.nn as nn
1010
import torch.nn.functional as F
1111
import habana_frameworks.torch as htorch
12+
import habana_frameworks.torch.utils.experimental as htexp
1213
from typing import List, Optional, Tuple
1314

1415
import vllm.hpu.utils as hpu_utils
1516

16-
PA_SPLIT_VALUE = (os.environ.get('PA_SPLIT_VALUE', '1') == '1')
17+
# FIXME: For some reason, splitting value causes DFAs on G3 (Gaudi3). This needs to be debugged.
18+
PA_SPLIT_VALUE_DEFAULT = '0' if (htexp._get_device_type() == htexp.synDeviceType.synDeviceGaudi3) else '1'
19+
PA_SPLIT_VALUE = (os.environ.get('PA_SPLIT_VALUE', PA_SPLIT_VALUE_DEFAULT) == '1')
1720

1821

1922
def silu_and_mul(output, input):

0 commit comments

Comments
 (0)