Skip to content

Commit

Permalink
Revert "Disable value splitting on G3 (#58)" (#74)
Browse files (browse the repository at this point in the history)
This reverts commit 47c0c5b.
  • Loading branch information
tzielinski-habana authored Jun 27, 2024
1 parent 2728599 commit 4a45bbf
Showing 1 changed file with 1 addition and 4 deletions.
5 changes: 1 addition & 4 deletions vllm/hpu/ops.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,14 +9,11 @@
import torch.nn as nn
import torch.nn.functional as F
import habana_frameworks.torch as htorch
import habana_frameworks.torch.utils.experimental as htexp
from typing import List, Optional, Tuple

import vllm.hpu.utils as hpu_utils

# FIXME: For some reason, splitting value causes DFAs on G3 (Gaudi3). This needs to be debugged.
PA_SPLIT_VALUE_DEFAULT = '0' if (htexp._get_device_type() == htexp.synDeviceType.synDeviceGaudi3) else '1'
PA_SPLIT_VALUE = (os.environ.get('PA_SPLIT_VALUE', PA_SPLIT_VALUE_DEFAULT) == '1')
PA_SPLIT_VALUE = (os.environ.get('PA_SPLIT_VALUE', '1') == '1')


def silu_and_mul(output, input):
Expand Down

0 comments on commit 4a45bbf

Please sign in to comment.