# mpt-7b-8k-chat-gptq / custom_embedding.py
# casperhansen's picture
# GPTQ quantized MPT model
# 081aec9
# raw
# history blame contribute delete
# 305 Bytes
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch import Tensor
class SharedEmbedding(nn.Embedding):
    """Embedding layer whose weight matrix can also be used to un-embed.

    With ``unembed=False`` (the default) this behaves exactly like
    ``nn.Embedding``. With ``unembed=True`` the same ``self.weight`` is
    applied as a bias-free linear projection, so a single parameter serves
    both directions.
    """

    def forward(self, input: Tensor, unembed: bool = False) -> Tensor:
        """Embed indices, or project a tensor through the embedding weight.

        Args:
            input: When ``unembed`` is false, the index tensor handed to
                ``nn.Embedding.forward``. When ``unembed`` is true, a
                tensor passed to ``F.linear`` together with ``self.weight``
                (so its last dimension has to match the weight's second
                dimension).
            unembed: Selects the projection path instead of the lookup.

        Returns:
            The result of ``nn.Embedding.forward(input)`` when ``unembed``
            is false, otherwise ``F.linear(input, self.weight)``.
        """
        if unembed:
            # No bias argument: F.linear multiplies by the transposed
            # embedding weight only.
            return F.linear(input, self.weight)
        return super().forward(input)