tangledgroup
/

tangled-alpha-0.1-core

Text Generation

Model card · Files and versions

mtasic85 committed on Feb 24, 2025

Commit

0f5ef2e

·

1 Parent(s): 1c9b116

micro_batch_size: 3

Files changed (1) hide show

scripts/pretrain-core-model.yaml +2 -1

scripts/pretrain-core-model.yaml CHANGED Viewed

@@ -67,7 +67,8 @@ train:
   # global_batch_size: 256
   # Number of samples per data-parallel rank (type: int, default: 4)
-  micro_batch_size: 4
   # micro_batch_size: 2
   # micro_batch_size: 1

   # global_batch_size: 256
   # Number of samples per data-parallel rank (type: int, default: 4)
+  # micro_batch_size: 4
+  micro_batch_size: 3
   # micro_batch_size: 2
   # micro_batch_size: 1