diff --git a/examples/sentence-transformers-training/nli/training_nli.py b/examples/sentence-transformers-training/nli/training_nli.py
index 602749a24c..2d051cedea 100644
--- a/examples/sentence-transformers-training/nli/training_nli.py
+++ b/examples/sentence-transformers-training/nli/training_nli.py
@@ -103,6 +103,7 @@ def main():
         warmup_ratio=0.1,
         # fp16=True,  # Set to False if you get an error that your GPU can't run on FP16
         bf16=args.bf16,  # Set to True if you have a GPU that supports BF16
+        # sdp_on_bf16=True,  # Set to True for better performance (but this setting can affect accuracy)
         # Optional tracking/debugging parameters:
         evaluation_strategy="steps",
         eval_steps=100,
diff --git a/examples/sentence-transformers-training/nli/training_nli_v2.py b/examples/sentence-transformers-training/nli/training_nli_v2.py
index aca9f6bc4d..f1346990b2 100644
--- a/examples/sentence-transformers-training/nli/training_nli_v2.py
+++ b/examples/sentence-transformers-training/nli/training_nli_v2.py
@@ -81,6 +81,7 @@ def main():
         warmup_ratio=0.1,
         # fp16=True,  # Set to False if you get an error that your GPU can't run on FP16
         # bf16=False,  # Set to True if you have a GPU that supports BF16
+        # sdp_on_bf16=True,  # Set to True for better performance (but this setting can affect accuracy)
         batch_sampler=BatchSamplers.NO_DUPLICATES,
         # Optional tracking/debugging parameters:
         evaluation_strategy="steps",
diff --git a/examples/sentence-transformers-training/nli/training_nli_v3.py b/examples/sentence-transformers-training/nli/training_nli_v3.py
index a833569651..384d78c6bc 100644
--- a/examples/sentence-transformers-training/nli/training_nli_v3.py
+++ b/examples/sentence-transformers-training/nli/training_nli_v3.py
@@ -82,6 +82,7 @@ def main():
         warmup_ratio=0.1,
         # fp16=True,  # Set to False if you get an error that your GPU can't run on FP16
         # bf16=False,  # Set to True if you have a GPU that supports BF16
+        # sdp_on_bf16=True,  # Set to True for better performance (but this setting can affect accuracy)
         batch_sampler=BatchSamplers.NO_DUPLICATES,
         # Optional tracking/debugging parameters:
         evaluation_strategy="steps",
diff --git a/examples/sentence-transformers-training/paraphrases/training_paraphrases.py b/examples/sentence-transformers-training/paraphrases/training_paraphrases.py
index d31bfd5796..67cb54f12b 100644
--- a/examples/sentence-transformers-training/paraphrases/training_paraphrases.py
+++ b/examples/sentence-transformers-training/paraphrases/training_paraphrases.py
@@ -101,6 +101,7 @@
     warmup_ratio=0.1,
     # fp16=True,  # Set to False if you get an error that your GPU can't run on FP16
     # bf16=False,  # Set to True if you have a GPU that supports BF16
+    # sdp_on_bf16=True,  # Set to True for better performance (but this setting can affect accuracy)
     batch_sampler=BatchSamplers.NO_DUPLICATES,  # MultipleNegativesRankingLoss benefits from no duplicate samples in a batch
     # We can use ROUND_ROBIN or PROPORTIONAL - to avoid focusing too much on one dataset, we will
     # use round robin, which samples the same amount of batches from each dataset, until one dataset is empty
diff --git a/examples/sentence-transformers-training/sts/training_stsbenchmark.py b/examples/sentence-transformers-training/sts/training_stsbenchmark.py
index fc5b474f25..4dd0b8884b 100644
--- a/examples/sentence-transformers-training/sts/training_stsbenchmark.py
+++ b/examples/sentence-transformers-training/sts/training_stsbenchmark.py
@@ -100,6 +100,7 @@ def main():
         warmup_ratio=0.1,
         # fp16=True,  # Set to False if you get an error that your GPU can't run on FP16
         bf16=args.bf16,  # Set to True if you have a GPU that supports BF16
+        # sdp_on_bf16=True,  # Set to True for better performance (but this setting can affect accuracy)
         # Optional tracking/debugging parameters:
         evaluation_strategy="steps",
         eval_steps=100,
diff --git a/examples/sentence-transformers-training/sts/training_stsbenchmark_continue_training.py b/examples/sentence-transformers-training/sts/training_stsbenchmark_continue_training.py
index 33dfcbdb6f..b537b32c45 100644
--- a/examples/sentence-transformers-training/sts/training_stsbenchmark_continue_training.py
+++ b/examples/sentence-transformers-training/sts/training_stsbenchmark_continue_training.py
@@ -75,6 +75,7 @@ def main():
         warmup_ratio=0.1,
         # fp16=True,  # Set to False if you get an error that your GPU can't run on FP16
         # bf16=False,  # Set to True if you have a GPU that supports BF16
+        # sdp_on_bf16=True,  # Set to True for better performance (but this setting can affect accuracy)
         # Optional tracking/debugging parameters:
         evaluation_strategy="steps",
         eval_steps=100,