We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 027f5d0 commit 0176060 (Copy full SHA for 0176060)
vllm/hpu/ops.py
@@ -9,11 +9,14 @@
9
import torch.nn as nn
10
import torch.nn.functional as F
11
import habana_frameworks.torch as htorch
12
+import habana_frameworks.torch.utils.experimental as htexp
13
from typing import List, Optional, Tuple
14
15
import vllm.hpu.utils as hpu_utils
16
-PA_SPLIT_VALUE = (os.environ.get('PA_SPLIT_VALUE', '1') == '1')
17
+# FIXME: For some reason, splitting the value causes DFAs on G3 (Gaudi3). This needs to be debugged.
18
+PA_SPLIT_VALUE_DEFAULT = '0' if (htexp._get_device_type() == htexp.synDeviceType.synDeviceGaudi3) else '1'
19
+PA_SPLIT_VALUE = (os.environ.get('PA_SPLIT_VALUE', PA_SPLIT_VALUE_DEFAULT) == '1')
20
21
22
def silu_and_mul(output, input):
0 commit comments