We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a0117c9 commit adb593a — Copy full SHA for adb593a
docs/config.qmd
@@ -510,7 +510,8 @@ train_on_inputs: false
510
# Note that training loss may have an oscillating pattern with this enabled.
511
group_by_length: false
512
513
-# Whether to use gradient checkpointing https://huggingface.co/docs/transformers/v4.18.0/en/performance#gradient-checkpointing
+# Whether to use gradient checkpointing. Available options are: true, false, "offload".
514
+# https://huggingface.co/docs/transformers/v4.18.0/en/performance#gradient-checkpointing
515
gradient_checkpointing: false
516
# Additional kwargs to pass to the trainer for gradient checkpointing.
517
# gradient_checkpointing_kwargs:
0 commit comments