mpt-7b-8k-chat-awq / custom_embedding.py
casperhansen's picture
MPT 7B 8K quantized
5c660fe
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch import Tensor
class SharedEmbedding(nn.Embedding):
    """Embedding layer whose weight matrix can also be used as an output projection.

    A single ``weight`` parameter serves both directions: the regular
    ``nn.Embedding`` lookup, and a bias-free linear map applied with that
    same matrix when ``unembed`` is requested.
    """

    def forward(self, input: Tensor, unembed: bool = False) -> Tensor:
        """Embed indices, or project features with the shared weight.

        Args:
            input: With ``unembed=False``, the index tensor handed to
                ``nn.Embedding.forward``. With ``unembed=True``, a tensor
                passed to ``F.linear``, so its last dimension must match
                ``self.weight.shape[-1]``.
            unembed: Selects the projection path instead of the lookup.

        Returns:
            The looked-up embeddings, or ``input @ self.weight.T`` when
            ``unembed`` is true.
        """
        # Default path: plain embedding lookup handled by the parent class.
        if not unembed:
            return super().forward(input)

        # Reuse the embedding matrix as the projection weight; no bias term.
        tied_weight = self.weight
        return F.linear(input, tied_weight)