From 3ab116106fa85c66a45673a7242a0ea8c76b3e3f Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Li=20Yudong=20=28=E6=9D=8E=E7=85=9C=E4=B8=9C=29?= Date: Wed, 25 Oct 2023 18:04:34 +0800 Subject: [PATCH] Update multi_headed_attn.py --- tencentpretrain/layers/multi_headed_attn.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tencentpretrain/layers/multi_headed_attn.py b/tencentpretrain/layers/multi_headed_attn.py index 1f17c75..b8e5dcf 100755 --- a/tencentpretrain/layers/multi_headed_attn.py +++ b/tencentpretrain/layers/multi_headed_attn.py @@ -1,6 +1,7 @@ import math import torch import torch.nn as nn +import torch.nn.functional as F from tencentpretrain.utils.rope import apply_rotary_emb from tencentpretrain.utils.lora import LoraLinear