diff --git a/modules/source/07_attention/attention_dev.py b/modules/source/07_attention/attention_dev.py
index 050e5f3e..c877d5ca 100644
--- a/modules/source/07_attention/attention_dev.py
+++ b/modules/source/07_attention/attention_dev.py
@@ -243,6 +243,8 @@ def scaled_dot_product_attention(Q: Tensor, K: Tensor, V: Tensor,
 
 # %% [markdown]
 """
+## 🔧 DEVELOPMENT
+
 ### 🧪 Test Your Attention Implementation
 
 Once you implement the `scaled_dot_product_attention` function above, run this cell to test it: