Embedding

`Embedding`

Bases: Module

Source code in src/transformer/modules/embedding.py

class Embedding(nn.Module):
    """Token-embedding layer whose output is scaled by sqrt(d_model)."""

    def __init__(self, d_model: int, vocab_size: int):
        """Build the lookup table for the Transformer input embedding.

        Args:
            d_model: the Transformer model dimension (width of each embedding)
            vocab_size: number of terms in our vocabulary (rows in the table)
        """
        super().__init__()
        self.d_model, self.vocab_size = d_model, vocab_size
        self.embedding = nn.Embedding(
            num_embeddings=vocab_size,
            embedding_dim=d_model,
        )

    def forward(self, x):
        """Look up the embeddings for ``x`` and rescale them.

        Note:
            Per section 3.4 of "Attention is All You Need", the looked-up
            vectors are multiplied by the square root of the model's
            dimension.
        """
        # Lookup happens first, then the scale is computed from d_model.
        vectors = self.embedding(x)
        scale = math.sqrt(self.d_model)
        return vectors * scale

`__init__(d_model, vocab_size)`

Transformer Input Embedding

Parameters:

Name	Type	Description	Default
`d_model`	`int`	the Transformer model dimension	required
`vocab_size`	`int`	number of terms in our vocabulary	required

Source code in src/transformer/modules/embedding.py

def __init__(self, d_model: int, vocab_size: int):
    """Build the lookup table for the Transformer input embedding.

    Args:
        d_model: the Transformer model dimension (width of each embedding)
        vocab_size: number of terms in our vocabulary (rows in the table)
    """
    super().__init__()
    self.d_model, self.vocab_size = d_model, vocab_size
    self.embedding = nn.Embedding(
        num_embeddings=vocab_size,
        embedding_dim=d_model,
    )

`forward(x)`

Embed our tokenized inputs

Note

Following section 3.4 in "Attention is All You Need", we multiply the embeddings by the square root of the model's dimension

Source code in src/transformer/modules/embedding.py

def forward(self, x):
    """Look up the embeddings for ``x`` and rescale them.

    Note:
        Per section 3.4 of "Attention is All You Need", the looked-up
        vectors are multiplied by the square root of the model's
        dimension.
    """
    # Lookup happens first, then the scale is computed from d_model.
    vectors = self.embedding(x)
    scale = math.sqrt(self.d_model)
    return vectors * scale

Embedding

Embedding

__init__(d_model, vocab_size)

forward(x)

`Embedding`

`__init__(d_model, vocab_size)`

`forward(x)`