Fix falcon 180b oom issue if peft > 0.6.2 (#895)
Signed-off-by: Wang, Yi A <[email protected]>
sywangyi committed Apr 18, 2024
1 parent 2df159b commit 8786b75
Showing 4 changed files with 9 additions and 0 deletions.
2 changes: 2 additions & 0 deletions optimum/habana/transformers/modeling_utils.py
@@ -88,6 +88,7 @@
     gaudi_esm_for_protein_folding_forward,
     gaudi_esmfolding_trunk_forward,
     gaudi_falcon_attention_split_heads,
+    gaudi_falcon_linear_forward,
     gaudi_generate_speech,
     gaudi_get_extended_attention_mask,
     gaudi_gpt2_block_forward,
@@ -307,6 +308,7 @@ def adapt_transformers_to_gaudi():
     transformers.models.falcon.modeling_falcon.FalconModel = GaudiFalconModel
     transformers.models.falcon.modeling_falcon.FalconDecoderLayer = GaudiFalconDecoderLayer
     transformers.models.falcon.modeling_falcon.FalconAttention._split_heads = gaudi_falcon_attention_split_heads
+    transformers.models.falcon.modeling_falcon.FalconLinear.forward = gaudi_falcon_linear_forward
 
     # Optimization for t5 on Gaudi
     transformers.models.t5.modeling_t5.T5LayerNorm.forward = gaudi_t5_layernorm_forward
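
For reference, a minimal usage sketch of how the patch takes effect (the checkpoint name and LoRA settings below are hypothetical placeholders, not part of this commit): adapt_transformers_to_gaudi() has to run before the PEFT model is built, so that FalconLinear.forward is already the Gaudi version by the time LoRA wraps the layers.

# Hypothetical usage sketch: apply the Gaudi overrides before wrapping the model with PEFT.
from optimum.habana.transformers.modeling_utils import adapt_transformers_to_gaudi
from transformers import AutoModelForCausalLM
from peft import LoraConfig, get_peft_model

adapt_transformers_to_gaudi()  # installs the monkey patches listed in the diff above

model = AutoModelForCausalLM.from_pretrained("tiiuae/falcon-180B")  # placeholder checkpoint
lora_config = LoraConfig(r=8, lora_alpha=16, target_modules=["query_key_value"], task_type="CAUSAL_LM")
model = get_peft_model(model, lora_config)  # LoRA-wrapped layers now dispatch into the patched FalconLinear.forward
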
1 change: 1 addition & 0 deletions optimum/habana/transformers/models/__init__.py
@@ -49,6 +49,7 @@
     GaudiFalconMLP,
     GaudiFalconModel,
     gaudi_falcon_attention_split_heads,
+    gaudi_falcon_linear_forward,
 )
 from .gpt2 import GaudiGPT2Attention, GaudiGPT2LMHeadModel, gaudi_gpt2_block_forward, gaudi_gpt2_forward
 from .gpt_bigcode import (
1 change: 1 addition & 0 deletions optimum/habana/transformers/models/falcon/__init__.py
@@ -5,4 +5,5 @@
     GaudiFalconMLP,
     GaudiFalconModel,
     gaudi_falcon_attention_split_heads,
+    gaudi_falcon_linear_forward,
 )
5 changes: 5 additions & 0 deletions optimum/habana/transformers/models/falcon/modeling_falcon.py
@@ -83,6 +83,11 @@ def apply_customized_rope(q, k, cos, sin, position_ids):
         return apply_rotary_pos_emb(q, k, cos, sin, position_ids)
 
 
+def gaudi_falcon_linear_forward(self, input: torch.Tensor) -> torch.Tensor:
+    hidden_states = F.linear(input, self.weight, bias=self.bias)
+    return hidden_states
+
+
 def gaudi_falcon_attention_split_heads(
     self, fused_qkv: torch.Tensor
 ) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
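
For context, upstream transformers implements FalconLinear.forward with an explicit matmul rather than F.linear; the upstream body sketched below is stated from memory and should be treated as an assumption about the transformers version this commit targets. The commit title suggests that this manual-matmul path is what ran Falcon-180B out of memory on Gaudi once peft > 0.6.2 started exercising it during LoRA fine-tuning, and gaudi_falcon_linear_forward routes the same computation through F.linear instead. A small CPU-only sanity check that the two paths agree numerically:

import torch
import torch.nn.functional as F
from torch import nn


# Assumed sketch of upstream transformers' FalconLinear: the matmul is written out by hand.
class UpstreamFalconLinear(nn.Linear):
    def forward(self, input: torch.Tensor) -> torch.Tensor:
        hidden_states = input @ self.weight.T
        if self.bias is None:
            return hidden_states
        return hidden_states + self.bias


# The Gaudi override from this commit: same math, but delegated to F.linear.
def gaudi_falcon_linear_forward(self, input: torch.Tensor) -> torch.Tensor:
    hidden_states = F.linear(input, self.weight, bias=self.bias)
    return hidden_states


layer = UpstreamFalconLinear(8, 8)
x = torch.randn(2, 8)
assert torch.allclose(layer(x), gaudi_falcon_linear_forward(layer, x), atol=1e-6)
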
