pretrain core 0
Browse files
scripts/pretrain-core-model-0.yaml
CHANGED
|
@@ -64,7 +64,7 @@ train:
|
|
| 64 |
# global_batch_size: 64
|
| 65 |
|
| 66 |
# Number of samples per data-parallel rank (type: int, default: 4)
|
| 67 |
- micro_batch_size:
|
| 68 |
# micro_batch_size: 4
|
| 69 |
# micro_batch_size: 2
|
| 70 |
# micro_batch_size: 1
|
|
|
|
| 64 |
# global_batch_size: 64
|
| 65 |
|
| 66 |
# Number of samples per data-parallel rank (type: int, default: 4)
|
| 67 |
+ micro_batch_size: 4
|
| 68 |
# micro_batch_size: 4
|
| 69 |
# micro_batch_size: 2
|
| 70 |
# micro_batch_size: 1
|