Spaces:

bala1802
/

FRIENDS-GPT

Sleeping

FRIENDS-GPT / block.py

Upload 7 files

dabde41 10 months ago

680 Bytes

	import torch.nn as nn

	from multi_head_attention import MultiHeadAttention
	from feedforward import FeedFoward

	class Block(nn.Module):
	    """Transformer block: communication followed by computation.

	    Each of the two sub-layers (multi-head attention, then feed-forward) is
	    applied to a layer-normalised copy of its input, and the sub-layer output
	    is added back onto the un-normalised input (residual connection).

	    Args:
	        n_embd: Embedding dimension. Used as the feature size of both
	            ``LayerNorm`` layers and passed to ``FeedFoward``.
	        n_head: The number of attention heads. Each head is given a size of
	            ``n_embd // n_head``.
	    """

	    def __init__(self, n_embd: int, n_head: int) -> None:
	        super().__init__()
	        # Floor division: any remainder of n_embd / n_head is dropped.
	        # NOTE(review): whether MultiHeadAttention copes with a head_size
	        # where n_head * head_size != n_embd is not visible here -- confirm.
	        head_size = n_embd // n_head
	        # Attribute names and creation order are kept stable so that
	        # state_dict keys and parameter ordering do not change.
	        self.sa = MultiHeadAttention(n_head, head_size)
	        self.ffwd = FeedFoward(n_embd)
	        self.ln1 = nn.LayerNorm(n_embd)
	        self.ln2 = nn.LayerNorm(n_embd)

	    def forward(self, x):
	        """Run attention and feed-forward, each wrapped in a residual add.

	        Args:
	            x: Input to the block; it must be accepted by ``ln1`` and be
	                addable to the outputs of ``sa`` and ``ffwd``.

	        Returns:
	            ``h + ffwd(ln2(h))`` where ``h = x + sa(ln1(x))``.
	        """
	        # Out-of-place additions on purpose: the caller's ``x`` is not mutated.
	        x = x + self.sa(self.ln1(x))
	        x = x + self.ffwd(self.ln2(x))
	        return x