Commit 0bfb2106 authored by Varuna Jayasiri

fix vit pe

Parent 4cf1d74e
@@ -39,7 +39,7 @@ Here's [an experiment](experiment.html) that trains ViT on CIFAR-10.
 This doesn't do very well because it's trained on a small dataset.
 It's a simple experiment that anyone can run and play with ViTs.
-[![View Run](https://img.shields.io/badge/labml-experiment-brightgreen)](https://app.labml.ai/run/8b531d9ce3dc11eb84fc87df6756eb8f)
+[![View Run](https://img.shields.io/badge/labml-experiment-brightgreen)](https://app.labml.ai/run/afdd5332188b11edbdf543360515b595)
 """
 import torch
@@ -114,7 +114,7 @@ class LearnedPositionalEmbeddings(Module):
         * `x` is the patch embeddings of shape `[patches, batch_size, d_model]`
         """
         # Get the positional embeddings for the given patches
-        pe = self.positional_encodings[x.shape[0]]
+        pe = self.positional_encodings[:x.shape[0]]
         # Add to patch embeddings and return
         return x + pe
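The one-character change above is the entire fix: `self.positional_encodings[x.shape[0]]` indexes a single row of the parameter, so after broadcasting every patch received the same positional embedding, whereas `[:x.shape[0]]` slices one embedding per patch position. Below is a minimal runnable sketch of the corrected module; it uses plain `nn.Module` in place of the repo's `Module` helper and assumes the parameter shape `[max_len, 1, d_model]` used elsewhere in the file:

```python
import torch
import torch.nn as nn


class LearnedPositionalEmbeddings(nn.Module):
    """Adds learned positional embeddings to patch embeddings."""

    def __init__(self, d_model: int, max_len: int = 5_000):
        super().__init__()
        # One learnable embedding per possible patch position
        self.positional_encodings = nn.Parameter(torch.zeros(max_len, 1, d_model))

    def forward(self, x: torch.Tensor):
        # `x` has shape `[patches, batch_size, d_model]`.
        # Slice the first `patches` rows -> `[patches, 1, d_model]`,
        # which broadcasts over the batch dimension.
        # The buggy version, `self.positional_encodings[x.shape[0]]`,
        # picked a single `[1, d_model]` row instead, so all patches
        # shared one positional embedding.
        pe = self.positional_encodings[:x.shape[0]]
        return x + pe


if __name__ == '__main__':
    pe = LearnedPositionalEmbeddings(d_model=512)
    x = torch.randn(64, 8, 512)  # 64 patches, batch of 8
    assert pe(x).shape == x.shape
```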
@@ -7,7 +7,7 @@ summary: >
 # Train a [Vision Transformer (ViT)](index.html) on CIFAR 10
-[![View Run](https://img.shields.io/badge/labml-experiment-brightgreen)](https://app.labml.ai/run/8b531d9ce3dc11eb84fc87df6756eb8f)
+[![View Run](https://img.shields.io/badge/labml-experiment-brightgreen)](https://app.labml.ai/run/afdd5332188b11edbdf543360515b595)
 """
 from labml import experiment
@@ -76,7 +76,7 @@ def main():
         'transformer.d_model': 512,
         # Training epochs and batch size
-        'epochs': 1000,
+        'epochs': 32,
         'train_batch_size': 64,
         # Augment CIFAR 10 images for training
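For context, these options are dictionary overrides passed to a labml configs object. The keys shown in the diff (`transformer.d_model`, `epochs`, `train_batch_size`) are real; the scaffolding below is a hedged sketch of the usual `labml` pattern with a toy stand-in for the experiment's own `Configs` class, not the repo's actual experiment code:

```python
from labml import experiment
from labml.configs import BaseConfigs


class Configs(BaseConfigs):
    """Toy stand-in for the experiment's configs class (hypothetical)."""
    epochs: int = 1000
    train_batch_size: int = 64


def main():
    conf = Configs()
    experiment.create(name='vit_cifar10_demo')  # hypothetical run name
    # Dictionary overrides replace the class defaults; this commit
    # drops `epochs` from 1000 to 32 in exactly this spot
    experiment.configs(conf, {
        'epochs': 32,
        'train_batch_size': 64,
    })
    with experiment.start():
        # Training loop would go here; `conf.epochs` now resolves to 32
        ...


if __name__ == '__main__':
    main()
```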