Language Model From Scratch Pdf | Build Large

class TransformerModel(nn.Module): def __init__(self, vocab_size, embedding_dim, num_heads, hidden_dim, num_layers): super(TransformerModel, self).__init__() self.embedding = nn.Embedding(vocab_size, embedding_dim) self.encoder = nn.TransformerEncoderLayer(d_model=embedding_dim, nhead=num_heads, dim_feedforward=hidden_dim, dropout=0.1) self.decoder = nn.TransformerDecoderLayer(d_model=embedding_dim, nhead=num_heads, dim_feedforward=hidden_dim, dropout=0.1) self.fc = nn.Linear(embedding_dim, vocab_size)